[{"key": "35232142", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.3830641873503641, "ground_truth": 0}, {"key": "35232142", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5117166061468714, "ground_truth": 0}, {"key": "35232142", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5563995698301696, "ground_truth": 0}, {"key": "35232142", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591092494024, "ground_truth": 0}, {"key": "35232142", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381319505242, "ground_truth": 0}, {"key": "40143035", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7534666577247222, "ground_truth": 0}, {"key": "40143035", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6584174919458806, "ground_truth": 0}, {"key": "40143035", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8210441174887421, "ground_truth": 0}, {"key": "40143035", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867842126452, "ground_truth": 0}, {"key": "40143035", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.798186784650415, "ground_truth": 0}, {"key": "35951548", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8976952948978507, "ground_truth": 0}, {"key": "35951548", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8991213756307378, "ground_truth": 0}, {"key": "35951548", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8289388106232064, "ground_truth": 0}, {"key": "35951548", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.674050496504847, "ground_truth": 0}, {"key": "35951548", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442251135252381, "ground_truth": 0}, {"key": "36266422", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5983122019422176, "ground_truth": 0}, {"key": "36266422", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7676898685500263, "ground_truth": 0}, {"key": "36266422", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7341195196745507, "ground_truth": 0}, {"key": "36266422", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527638190955, "ground_truth": 0}, {"key": "36266422", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008948050027998, "ground_truth": 0}, {"key": "38826984", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5448013934790849, "ground_truth": 0}, {"key": "38826984", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6406358429404104, "ground_truth": 0}, {"key": "38826984", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6774740246972197, "ground_truth": 0}, {"key": "38826984", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432322744199, "ground_truth": 0}, {"key": "38826984", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460137281697561, "ground_truth": 0}, {"key": "34540833", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8568123014992987, "ground_truth": 0}, {"key": "34540833", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8697145853962118, "ground_truth": 0}, {"key": "34540833", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8864204063956972, "ground_truth": 0}, {"key": "34540833", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672246071567, "ground_truth": 0}, {"key": "34540833", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163666401682, "ground_truth": 0}, {"key": "20836172", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8175744754319536, "ground_truth": 0}, {"key": "20836172", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7745833925109707, "ground_truth": 0}, {"key": "20836172", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8469578367497804, "ground_truth": 0}, {"key": "20836172", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.726425622024197, "ground_truth": 0}, {"key": "20836172", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.675764620820595, "ground_truth": 0}, {"key": "35932467", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7648915877311107, "ground_truth": 0}, {"key": "35932467", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7839884616100907, "ground_truth": 0}, {"key": "35932467", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7592254226490078, "ground_truth": 0}, {"key": "35932467", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593445051754, "ground_truth": 0}, {"key": "35932467", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982193377297, "ground_truth": 0}, {"key": "40758845", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8976953085222061, "ground_truth": 0}, {"key": "40758845", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.834406884262132, "ground_truth": 0}, {"key": "40758845", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8902942291636629, "ground_truth": 0}, {"key": "40758845", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366467409799, "ground_truth": 0}, {"key": "40758845", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104470055327, "ground_truth": 0}, {"key": "30358490", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8128673262204068, "ground_truth": 0}, {"key": "30358490", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7648916040461495, "ground_truth": 0}, {"key": "30358490", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8080672154654969, "ground_truth": 0}, {"key": "30358490", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581566907115, "ground_truth": 0}, {"key": "30358490", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149138850505, "ground_truth": 0}, {"key": "34615665", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9155072425887284, "ground_truth": 0}, {"key": "34615665", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8856314717031789, "ground_truth": 0}, {"key": "34615665", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9252299455572812, "ground_truth": 0}, {"key": "34615665", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9763105317380604, "ground_truth": 0}, {"key": "34615665", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9319595792708875, "ground_truth": 0}, {"key": "35890902", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7853086036425597, "ground_truth": 0}, {"key": "35890902", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7416740093612649, "ground_truth": 0}, {"key": "35890902", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8128673135612354, "ground_truth": 0}, {"key": "35890902", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723658452591, "ground_truth": 0}, {"key": "35890902", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118957892425, "ground_truth": 0}, {"key": "37922330", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.653126937168719, "ground_truth": 0}, {"key": "37922330", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5640985036365905, "ground_truth": 0}, {"key": "37922330", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7879312052252819, "ground_truth": 0}, {"key": "37922330", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876300126887644, "ground_truth": 0}, {"key": "37922330", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799928839922783, "ground_truth": 0}, {"key": "30844962", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7074046822861156, "ground_truth": 0}, {"key": "30844962", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6169358078493212, "ground_truth": 0}, {"key": "30844962", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7025300505862891, "ground_truth": 0}, {"key": "30844962", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241632057133, "ground_truth": 0}, {"key": "30844962", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026692847998, "ground_truth": 0}, {"key": "36217333", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6477982059015052, "ground_truth": 0}, {"key": "36217333", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6001883659871947, "ground_truth": 0}, {"key": "36217333", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6297746292921528, "ground_truth": 0}, {"key": "36217333", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241628201975, "ground_truth": 0}, {"key": "36217333", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381476531782, "ground_truth": 0}, {"key": "30816523", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8164063804968926, "ground_truth": 0}, {"key": "30816523", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7634837704725833, "ground_truth": 0}, {"key": "30816523", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7905303267827664, "ground_truth": 0}, {"key": "30816523", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701001954822, "ground_truth": 0}, {"key": "30816523", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366000489657, "ground_truth": 0}, {"key": "38900884", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8438951093358439, "ground_truth": 0}, {"key": "38900884", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8499711876747571, "ground_truth": 0}, {"key": "38900884", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8509647090343152, "ground_truth": 0}, {"key": "38900884", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228384755936, "ground_truth": 0}, {"key": "38900884", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.779992901468926, "ground_truth": 0}, {"key": "13890581", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7839884607266738, "ground_truth": 0}, {"key": "13890581", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5736783839450458, "ground_truth": 0}, {"key": "13890581", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7879311807221807, "ground_truth": 0}, {"key": "13890581", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835331931191, "ground_truth": 0}, {"key": "13890581", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307600807692, "ground_truth": 0}, {"key": "40194700", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7879311862074042, "ground_truth": 0}, {"key": "40194700", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8529354672495476, "ground_truth": 0}, {"key": "40194700", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8449215274450368, "ground_truth": 0}, {"key": "40194700", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9005297937021473, "ground_truth": 0}, {"key": "40194700", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8969755710005132, "ground_truth": 0}, {"key": "37903647", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5525397246779935, "ground_truth": 0}, {"key": "37903647", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.723309482972797, "ground_truth": 0}, {"key": "37903647", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5195213140923154, "ground_truth": 0}, {"key": "37903647", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291149329397, "ground_truth": 0}, {"key": "37903647", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224855189499, "ground_truth": 0}, {"key": "13291223", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8044059062820834, "ground_truth": 0}, {"key": "13291223", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6442250957907577, "ground_truth": 0}, {"key": "13291223", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7310585834860389, "ground_truth": 0}, {"key": "13291223", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325263709612, "ground_truth": 0}, {"key": "13291223", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916174553361, "ground_truth": 0}, {"key": "36052570", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.615087835858605, "ground_truth": 0}, {"key": "36052570", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6279512090011353, "ground_truth": 0}, {"key": "36052570", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7185943939343198, "ground_truth": 0}, {"key": "36052570", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.613236577060013, "ground_truth": 0}, {"key": "36052570", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197731952656, "ground_truth": 0}, {"key": "34944735", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8577681177908439, "ground_truth": 0}, {"key": "34944735", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9184802545834215, "ground_truth": 0}, {"key": "34944735", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.891811045441653, "ground_truth": 0}, {"key": "34944735", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215301338886, "ground_truth": 0}, {"key": "34944735", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206751054086, "ground_truth": 0}, {"key": "32159602", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6636689297191541, "ground_truth": 0}, {"key": "32159602", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7969253899977314, "ground_truth": 0}, {"key": "32159602", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6943026692099351, "ground_truth": 0}, {"key": "32159602", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943820271525, "ground_truth": 0}, {"key": "32159602", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592254004221359, "ground_truth": 0}, {"key": "34988915", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8140527967424527, "ground_truth": 0}, {"key": "34988915", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7772998620029048, "ground_truth": 0}, {"key": "34988915", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7431679785912254, "ground_truth": 0}, {"key": "34988915", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253566539232, "ground_truth": 0}, {"key": "34988915", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159699849473, "ground_truth": 0}, {"key": "37889203", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8799743649228929, "ground_truth": 0}, {"key": "37889203", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8918110395379987, "ground_truth": 0}, {"key": "37889203", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8749346155094712, "ground_truth": 0}, {"key": "37889203", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846351227049, "ground_truth": 0}, {"key": "37889203", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767934294392, "ground_truth": 0}, {"key": "33609927", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8479677511065566, "ground_truth": 0}, {"key": "33609927", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8519528105530965, "ground_truth": 0}, {"key": "33609927", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7606506356405335, "ground_truth": 0}, {"key": "33609927", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619453668274, "ground_truth": 0}, {"key": "33609927", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281659314991, "ground_truth": 0}, {"key": "33578778", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.689305622919123, "ground_truth": 0}, {"key": "33578778", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7879311946877086, "ground_truth": 0}, {"key": "33578778", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7233094837697978, "ground_truth": 0}, {"key": "33578778", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105351057955, "ground_truth": 0}, {"key": "33578778", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666392075272, "ground_truth": 0}, {"key": "36888270", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8548846481186265, "ground_truth": 0}, {"key": "36888270", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6057990428424, "ground_truth": 0}, {"key": "36888270", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253748468705, "ground_truth": 0}, {"key": "36888270", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867790283619, "ground_truth": 0}, {"key": "36888270", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089290105014, "ground_truth": 0}, {"key": "36846007", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9489172574733935, "ground_truth": 0}, {"key": "36846007", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9632305322387708, "ground_truth": 0}, {"key": "36846007", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9597620573539999, "ground_truth": 0}, {"key": "36846007", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9600626871068136, "ground_truth": 0}, {"key": "36846007", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9585377258282246, "ground_truth": 0}, {"key": "31723471", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.697608913020356, "ground_truth": 0}, {"key": "31723471", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7866228483416134, "ground_truth": 0}, {"key": "31723471", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.763483780377971, "ground_truth": 0}, {"key": "31723471", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842639998933275, "ground_truth": 0}, {"key": "31723471", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358414134247, "ground_truth": 0}, {"key": "15921828", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6976089080457486, "ground_truth": 0}, {"key": "15921828", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.647798222303489, "ground_truth": 0}, {"key": "15921828", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6992544457541231, "ground_truth": 0}, {"key": "15921828", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094692510585, "ground_truth": 0}, {"key": "15921828", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175068714101, "ground_truth": 0}, {"key": "39109408", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5717665995462381, "ground_truth": 0}, {"key": "39109408", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6206216097365757, "ground_truth": 0}, {"key": "39109408", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6654105731363734, "ground_truth": 0}, {"key": "39109408", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4765796728478657, "ground_truth": 0}, {"key": "39109408", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.598312209618443, "ground_truth": 0}, {"key": "20936833", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5774953640305366, "ground_truth": 0}, {"key": "20936833", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5078118797390422, "ground_truth": 0}, {"key": "20936833", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.505859078227344, "ground_truth": 0}, {"key": "20936833", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646082984439, "ground_truth": 0}, {"key": "20936833", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.3998116277062659, "ground_truth": 0}, {"key": "36832879", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6039318422220883, "ground_truth": 0}, {"key": "36832879", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.548673499077201, "ground_truth": 0}, {"key": "36832879", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5175708928800523, "ground_truth": 0}, {"key": "36832879", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324583914163, "ground_truth": 0}, {"key": "36832879", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631928504432, "ground_truth": 0}, {"key": "14958201", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9207896682542287, "ground_truth": 0}, {"key": "14958201", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8933094129706733, "ground_truth": 0}, {"key": "14958201", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8509646994474279, "ground_truth": 0}, {"key": "14958201", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9155072418878382, "ground_truth": 0}, {"key": "14958201", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206787940426, "ground_truth": 0}, {"key": "34352262", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5117165880099585, "ground_truth": 0}, {"key": "34352262", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7057850410934081, "ground_truth": 0}, {"key": "34352262", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6406358741231352, "ground_truth": 0}, {"key": "34352262", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315943037773313, "ground_truth": 0}, {"key": "34352262", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615948166372, "ground_truth": 0}, {"key": "39805395", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.40544870683153933, "ground_truth": 0}, {"key": "39805395", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5467381424423328, "ground_truth": 0}, {"key": "39805395", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7057850400375738, "ground_truth": 0}, {"key": "39805395", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.731058591506827, "ground_truth": 0}, {"key": "39805395", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746046565478, "ground_truth": 0}, {"key": "34303109", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6992544259535373, "ground_truth": 0}, {"key": "34303109", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6477982008946552, "ground_truth": 0}, {"key": "34303109", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6388352982556769, "ground_truth": 0}, {"key": "34303109", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.69264199443661, "ground_truth": 0}, {"key": "34303109", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283045219493, "ground_truth": 0}, {"key": "39939090", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7732163765151273, "ground_truth": 0}, {"key": "39939090", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7690802441055934, "ground_truth": 0}, {"key": "39939090", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8469578505395807, "ground_truth": 0}, {"key": "39939090", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528126488212, "ground_truth": 0}, {"key": "39939090", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.721743213206644, "ground_truth": 0}, {"key": "29347771", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7676898684642988, "ground_truth": 0}, {"key": "29347771", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8267117980596876, "ground_truth": 0}, {"key": "29347771", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7866228352470923, "ground_truth": 0}, {"key": "29347771", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933238308737, "ground_truth": 0}, {"key": "29347771", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218469369407, "ground_truth": 0}, {"key": "36783415", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8887587959299762, "ground_truth": 0}, {"key": "36783415", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7386690707602589, "ground_truth": 0}, {"key": "36783415", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8244619365366369, "ground_truth": 0}, {"key": "36783415", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.753466681226418, "ground_truth": 0}, {"key": "36783415", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441197848848, "ground_truth": 0}, {"key": "37935687", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8799743681700098, "ground_truth": 0}, {"key": "37935687", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8872045947602327, "ground_truth": 0}, {"key": "37935687", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8969755834930648, "ground_truth": 0}, {"key": "37935687", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9319595824974152, "ground_truth": 0}, {"key": "37935687", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9289263247683299, "ground_truth": 0}, {"key": "40260829", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7994423234926122, "ground_truth": 0}, {"key": "40260829", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8056321837137725, "ground_truth": 0}, {"key": "40260829", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8606036218448772, "ground_truth": 0}, {"key": "40260829", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346126868871, "ground_truth": 0}, {"key": "40260829", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424496492897, "ground_truth": 0}, {"key": "36478199", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8128673204890436, "ground_truth": 0}, {"key": "36478199", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7786493082108589, "ground_truth": 0}, {"key": "36478199", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.838679769672725, "ground_truth": 0}, {"key": "36478199", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544116611759, "ground_truth": 0}, {"key": "36478199", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377731687114, "ground_truth": 0}, {"key": "34541803", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8198933376936697, "ground_truth": 0}, {"key": "34541803", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6601723583987588, "ground_truth": 0}, {"key": "34541803", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8210441127482716, "ground_truth": 0}, {"key": "34541803", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325295443855, "ground_truth": 0}, {"key": "34541803", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199592122018, "ground_truth": 0}, {"key": "35360841", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8386797587162409, "ground_truth": 0}, {"key": "35360841", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8799743723823515, "ground_truth": 0}, {"key": "35360841", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8164063723418533, "ground_truth": 0}, {"key": "35360841", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142395975068, "ground_truth": 0}, {"key": "35360841", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068890733486, "ground_truth": 0}, {"key": "35550407", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7185943888677125, "ground_truth": 0}, {"key": "35550407", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6279511893908118, "ground_truth": 0}, {"key": "35550407", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5486734920697185, "ground_truth": 0}, {"key": "35550407", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872045571798, "ground_truth": 0}, {"key": "35550407", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804092573711, "ground_truth": 0}, {"key": "37561590", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6992543901770713, "ground_truth": 0}, {"key": "37561590", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7772998546333888, "ground_truth": 0}, {"key": "37561590", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8221891407004844, "ground_truth": 0}, {"key": "37561590", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.793105948297389, "ground_truth": 0}, {"key": "37561590", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163563228273, "ground_truth": 0}, {"key": "39328843", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9046505361065036, "ground_truth": 0}, {"key": "39328843", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.927363296952922, "ground_truth": 0}, {"key": "39328843", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9178933698703021, "ground_truth": 0}, {"key": "39328843", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9142907266190252, "ground_truth": 0}, {"key": "39328843", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372107938526221, "ground_truth": 0}, {"key": "35389665", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9674102549084582, "ground_truth": 0}, {"key": "35389665", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9585377279447193, "ground_truth": 0}, {"key": "35389665", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9559813472365548, "ground_truth": 0}, {"key": "35389665", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9621075761808726, "ground_truth": 0}, {"key": "35389665", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.956957149497176, "ground_truth": 0}, {"key": "33080187", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6723317155599324, "ground_truth": 0}, {"key": "33080187", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7057850271258235, "ground_truth": 0}, {"key": "33080187", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6406358598755644, "ground_truth": 0}, {"key": "33080187", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948031228194, "ground_truth": 0}, {"key": "33080187", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201714996839114, "ground_truth": 0}, {"key": "38636995", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7994423120097226, "ground_truth": 0}, {"key": "38636995", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7892337023195426, "ground_truth": 0}, {"key": "38636995", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7431679900449308, "ground_truth": 0}, {"key": "38636995", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740331087153, "ground_truth": 0}, {"key": "38636995", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239867615682, "ground_truth": 0}, {"key": "18536236", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8774767791105742, "ground_truth": 0}, {"key": "18536236", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7490872092647896, "ground_truth": 0}, {"key": "18536236", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6076631621140685, "ground_truth": 0}, {"key": "18536236", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581671991659, "ground_truth": 0}, {"key": "18536236", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149642648204, "ground_truth": 0}, {"key": "36289151", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5350984394781242, "ground_truth": 0}, {"key": "36289151", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7025300685245134, "ground_truth": 0}, {"key": "36289151", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5544704655475685, "ground_truth": 0}, {"key": "36289151", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460137078649875, "ground_truth": 0}, {"key": "36289151", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460136737864919, "ground_truth": 0}, {"key": "23017045", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8187367911054787, "ground_truth": 0}, {"key": "23017045", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8832359936833153, "ground_truth": 0}, {"key": "23017045", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8955226711779568, "ground_truth": 0}, {"key": "23017045", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797609678471, "ground_truth": 0}, {"key": "23017045", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122283927111, "ground_truth": 0}, {"key": "36418082", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8080672335540731, "ground_truth": 0}, {"key": "36418082", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.738669082637639, "ground_truth": 0}, {"key": "36418082", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8418256545999929, "ground_truth": 0}, {"key": "36418082", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430369964623, "ground_truth": 0}, {"key": "36418082", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867801022527, "ground_truth": 0}, {"key": "34396551", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7008948084866393, "ground_truth": 0}, {"key": "34396551", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5679366088866208, "ground_truth": 0}, {"key": "34396551", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6261241889881943, "ground_truth": 0}, {"key": "34396551", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548764417493, "ground_truth": 0}, {"key": "34396551", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632737031874, "ground_truth": 0}, {"key": "39720944", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9736446493343581, "ground_truth": 0}, {"key": "39720944", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9353465079222274, "ground_truth": 0}, {"key": "39720944", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9609517111913002, "ground_truth": 0}, {"key": "39720944", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9219218432393143, "ground_truth": 0}, {"key": "39720944", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.949669374273024, "ground_truth": 0}, {"key": "35884842", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6909762950321238, "ground_truth": 0}, {"key": "35884842", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6187804135254682, "ground_truth": 0}, {"key": "35884842", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5813031170218991, "ground_truth": 0}, {"key": "35884842", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.583203384282273, "ground_truth": 0}, {"key": "35884842", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984328889009, "ground_truth": 0}, {"key": "35403375", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.611381993220654, "ground_truth": 0}, {"key": "35403375", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5774953681751799, "ground_truth": 0}, {"key": "35403375", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5869964499806926, "ground_truth": 0}, {"key": "35403375", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4746311807897404, "ground_truth": 0}, {"key": "35403375", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.48438008641014363, "ground_truth": 0}, {"key": "26341324", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9235923137405235, "ground_truth": 0}, {"key": "26341324", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9284088028173079, "ground_truth": 0}, {"key": "26341324", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.877476792068509, "ground_truth": 0}, {"key": "26341324", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288497943097, "ground_truth": 0}, {"key": "26341324", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891209184775, "ground_truth": 0}, {"key": "19212345", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8175744832634994, "ground_truth": 0}, {"key": "19212345", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8714748697039828, "ground_truth": 0}, {"key": "19212345", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9019206715775722, "ground_truth": 0}, {"key": "19212345", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149083498089, "ground_truth": 0}, {"key": "19212345", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743665784279, "ground_truth": 0}, {"key": "30548367", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6654105438367345, "ground_truth": 0}, {"key": "30548367", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7759445504137781, "ground_truth": 0}, {"key": "30548367", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8723473716769018, "ground_truth": 0}, {"key": "30548367", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666751358965, "ground_truth": 0}, {"key": "30548367", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059484856539, "ground_truth": 0}, {"key": "37919402", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8438951242840325, "ground_truth": 0}, {"key": "37919402", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.890294228490072, "ground_truth": 0}, {"key": "37919402", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8548846278957265, "ground_truth": 0}, {"key": "37919402", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357584711866, "ground_truth": 0}, {"key": "37919402", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942228911621, "ground_truth": 0}, {"key": "39995133", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8976952935281627, "ground_truth": 0}, {"key": "39995133", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.929440407454711, "ground_truth": 0}, {"key": "39995133", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.885631466655598, "ground_truth": 0}, {"key": "39995133", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872045849774747, "ground_truth": 0}, {"key": "39995133", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281534638477, "ground_truth": 0}, {"key": "40249088", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6842640307591472, "ground_truth": 0}, {"key": "40249088", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8697145739514511, "ground_truth": 0}, {"key": "40249088", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5755880321577188, "ground_truth": 0}, {"key": "40249088", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918211592441, "ground_truth": 0}, {"key": "40249088", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149722452763, "ground_truth": 0}, {"key": "40254388", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6495786069045345, "ground_truth": 0}, {"key": "40254388", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8019358106183911, "ground_truth": 0}, {"key": "40254388", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6893056441234579, "ground_truth": 0}, {"key": "40254388", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382191307284, "ground_truth": 0}, {"key": "40254388", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933218432873, "ground_truth": 0}, {"key": "31995230", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8152324870790919, "ground_truth": 0}, {"key": "31995230", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7520125887686024, "ground_truth": 0}, {"key": "31995230", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7461390018468073, "ground_truth": 0}, {"key": "31995230", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799928833213284, "ground_truth": 0}, {"key": "31995230", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430522556197, "ground_truth": 0}, {"key": "38632129", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9640516800495701, "ground_truth": 0}, {"key": "38632129", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9671630442247265, "ground_truth": 0}, {"key": "38632129", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9713473306913591, "ground_truth": 0}, {"key": "38632129", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9648551513749979, "ground_truth": 0}, {"key": "38632129", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9546474205384909, "ground_truth": 0}, {"key": "35720795", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8386797652149177, "ground_truth": 0}, {"key": "35720795", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.746138988443664, "ground_truth": 0}, {"key": "35720795", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7772998664846931, "ground_truth": 0}, {"key": "35720795", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185717920515, "ground_truth": 0}, {"key": "35720795", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044058950954015, "ground_truth": 0}, {"key": "23906759", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9532750426667815, "ground_truth": 0}, {"key": "23906759", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9485372356747039, "ground_truth": 0}, {"key": "23906759", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9525741238421701, "ground_truth": 0}, {"key": "23906759", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9579122749616348, "ground_truth": 0}, {"key": "23906759", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9536217894048091, "ground_truth": 0}, {"key": "19410108", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7122322034586918, "ground_truth": 0}, {"key": "19410108", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8407825906290934, "ground_truth": 0}, {"key": "19410108", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7943849753743067, "ground_truth": 0}, {"key": "19410108", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919927157679, "ground_truth": 0}, {"key": "19410108", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438951163963477, "ground_truth": 0}, {"key": "30745137", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6315943127887631, "ground_truth": 0}, {"key": "30745137", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7476159616753345, "ground_truth": 0}, {"key": "30745137", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7956581092182996, "ground_truth": 0}, {"key": "30745137", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621765060921068, "ground_truth": 0}, {"key": "30745137", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419790087318, "ground_truth": 0}, {"key": "26553115", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7341195155057523, "ground_truth": 0}, {"key": "26553115", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.760650653268367, "ground_truth": 0}, {"key": "26553115", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8006919947551266, "ground_truth": 0}, {"key": "26553115", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754398505621, "ground_truth": 0}, {"key": "26553115", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504781889336, "ground_truth": 0}, {"key": "37872311", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.705785024112302, "ground_truth": 0}, {"key": "37872311", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6406358586466767, "ground_truth": 0}, {"key": "37872311", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7718434879665959, "ground_truth": 0}, {"key": "37872311", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631424171512, "ground_truth": 0}, {"key": "37872311", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159638324448, "ground_truth": 0}, {"key": "35553131", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9462003569240605, "ground_truth": 0}, {"key": "35553131", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.951142222381082, "ground_truth": 0}, {"key": "35553131", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9235923172045327, "ground_truth": 0}, {"key": "35553131", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916164807875, "ground_truth": 0}, {"key": "35553131", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549508100852, "ground_truth": 0}, {"key": "39038936", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6442250872149151, "ground_truth": 0}, {"key": "39038936", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7718435164699917, "ground_truth": 0}, {"key": "39038936", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7371581796543525, "ground_truth": 0}, {"key": "39038936", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837478056571, "ground_truth": 0}, {"key": "39038936", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527554107169, "ground_truth": 0}, {"key": "38735486", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9828232915454139, "ground_truth": 0}, {"key": "38735486", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9939024374166592, "ground_truth": 0}, {"key": "38735486", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9846936446124964, "ground_truth": 0}, {"key": "38735486", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9881308796007833, "ground_truth": 0}, {"key": "38735486", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9911526437722776, "ground_truth": 0}, {"key": "17087845", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5234203752142933, "ground_truth": 0}, {"key": "17087845", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6976089277841587, "ground_truth": 0}, {"key": "17087845", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6723316962268352, "ground_truth": 0}, {"key": "17087845", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684398072565, "ground_truth": 0}, {"key": "17087845", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269974843041, "ground_truth": 0}, {"key": "37443011", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8221891274970166, "ground_truth": 0}, {"key": "37443011", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7248702637530862, "ground_truth": 0}, {"key": "37443011", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.787931208279687, "ground_truth": 0}, {"key": "37443011", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942227407863, "ground_truth": 0}, {"key": "37443011", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680210938489, "ground_truth": 0}, {"key": "36855749", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8633916185885936, "ground_truth": 0}, {"key": "36855749", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8799743783304419, "ground_truth": 0}, {"key": "36855749", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7759445465108339, "ground_truth": 0}, {"key": "36855749", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511474884297, "ground_truth": 0}, {"key": "36855749", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647047230348, "ground_truth": 0}, {"key": "35613141", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9678992950753746, "ground_truth": 0}, {"key": "35613141", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9591542854625367, "ground_truth": 0}, {"key": "35613141", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9390248194801455, "ground_truth": 0}, {"key": "35613141", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9289263287763672, "ground_truth": 0}, {"key": "35613141", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9425067239917316, "ground_truth": 0}, {"key": "39088847", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8459424449298367, "ground_truth": 0}, {"key": "39088847", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6876299876038546, "ground_truth": 0}, {"key": "39088847", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358185396279, "ground_truth": 0}, {"key": "39088847", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215545515439, "ground_truth": 0}, {"key": "39088847", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423271170654, "ground_truth": 0}, {"key": "33197277", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7563575585116599, "ground_truth": 0}, {"key": "33197277", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8244619219487531, "ground_truth": 0}, {"key": "33197277", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.903294210710621, "ground_truth": 0}, {"key": "33197277", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358274541025, "ground_truth": 0}, {"key": "33197277", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837616307338, "ground_truth": 0}, {"key": "33815489", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6619228959715169, "ground_truth": 0}, {"key": "33815489", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6001883487566501, "ground_truth": 0}, {"key": "33815489", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6370308026005674, "ground_truth": 0}, {"key": "33815489", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093876217113, "ground_truth": 0}, {"key": "33815489", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819742464993, "ground_truth": 0}, {"key": "35862754", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9167080759977708, "ground_truth": 0}, {"key": "35862754", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9086178929875037, "ground_truth": 0}, {"key": "35862754", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8670357579559201, "ground_truth": 0}, {"key": "35862754", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743696136324, "ground_truth": 0}, {"key": "35862754", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.892562532406242, "ground_truth": 0}, {"key": "36080615", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6224593254003319, "ground_truth": 0}, {"key": "36080615", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5907792054188793, "ground_truth": 0}, {"key": "36080615", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.721743220731985, "ground_truth": 0}, {"key": "36080615", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254008345269, "ground_truth": 0}, {"key": "36080615", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102644314282, "ground_truth": 0}, {"key": "22822742", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8661325158482331, "ground_truth": 0}, {"key": "22822742", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.863391601255352, "ground_truth": 0}, {"key": "22822742", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8479677627639146, "ground_truth": 0}, {"key": "22822742", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104635304512, "ground_truth": 0}, {"key": "22822742", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8925625254513704, "ground_truth": 0}, {"key": "39747536", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9284088014139533, "ground_truth": 0}, {"key": "39747536", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9314625015435751, "ground_truth": 0}, {"key": "39747536", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.939913350460297, "ground_truth": 0}, {"key": "39747536", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9385759623593183, "ground_truth": 0}, {"key": "39747536", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418181097316, "ground_truth": 0}, {"key": "34218396", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7918210569179478, "ground_truth": 0}, {"key": "34218396", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.871474865812181, "ground_truth": 0}, {"key": "34218396", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8940517156042945, "ground_truth": 0}, {"key": "34218396", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.866132510323489, "ground_truth": 0}, {"key": "34218396", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849498620418, "ground_truth": 0}, {"key": "39150388", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.884039274370545, "ground_truth": 0}, {"key": "39150388", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.847967763897706, "ground_truth": 0}, {"key": "39150388", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8289387995934971, "ground_truth": 0}, {"key": "39150388", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267711520603, "ground_truth": 0}, {"key": "39150388", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314699806306, "ground_truth": 0}, {"key": "28765782", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8643104517837247, "ground_truth": 0}, {"key": "28765782", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7138307645534441, "ground_truth": 0}, {"key": "28765782", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8697145762260212, "ground_truth": 0}, {"key": "28765782", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8940517155953135, "ground_truth": 0}, {"key": "28765782", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253771933963, "ground_truth": 0}, {"key": "35828022", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.3380771324599187, "ground_truth": 0}, {"key": "35828022", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6706082678759018, "ground_truth": 0}, {"key": "35828022", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059283533492, "ground_truth": 0}, {"key": "35828022", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191403522924, "ground_truth": 0}, {"key": "35828022", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715236095751, "ground_truth": 0}, {"key": "27717735", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7371581576708697, "ground_truth": 0}, {"key": "27717735", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6132365623680078, "ground_truth": 0}, {"key": "27717735", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6842640172170881, "ground_truth": 0}, {"key": "27717735", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582373893397, "ground_truth": 0}, {"key": "27717735", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307593402983, "ground_truth": 0}, {"key": "37977826", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6424324461113429, "ground_truth": 0}, {"key": "37977826", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6548947306177915, "ground_truth": 0}, {"key": "37977826", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5717666083959939, "ground_truth": 0}, {"key": "37977826", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646090243336, "ground_truth": 0}, {"key": "37977826", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.69097628536045, "ground_truth": 0}, {"key": "31768588", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9241418195211395, "ground_truth": 0}, {"key": "31768588", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.922482344485492, "ground_truth": 0}, {"key": "31768588", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.952574123367987, "ground_truth": 0}, {"key": "31768588", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869898169142, "ground_truth": 0}, {"key": "31768588", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218437739088, "ground_truth": 0}, {"key": "37183351", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.49609379522282665, "ground_truth": 0}, {"key": "37183351", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.49609386103321407, "ground_truth": 0}, {"key": "37183351", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5621764785985208, "ground_truth": 0}, {"key": "37183351", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.513668498984097, "ground_truth": 0}, {"key": "37183351", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199378068065, "ground_truth": 0}, {"key": "39622090", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8418256471986507, "ground_truth": 0}, {"key": "39622090", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8661325244783065, "ground_truth": 0}, {"key": "39622090", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8624675313851996, "ground_truth": 0}, {"key": "39622090", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104635622003, "ground_truth": 0}, {"key": "39622090", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916107771397, "ground_truth": 0}, {"key": "39272756", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6513548570328938, "ground_truth": 0}, {"key": "39272756", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5640984569809706, "ground_truth": 0}, {"key": "39272756", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.46295860919280585, "ground_truth": 0}, {"key": "39272756", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740466397965, "ground_truth": 0}, {"key": "39272756", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527492308167, "ground_truth": 0}, {"key": "32138822", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6619228759794394, "ground_truth": 0}, {"key": "32138822", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7356416762564961, "ground_truth": 0}, {"key": "32138822", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7295197706843376, "ground_truth": 0}, {"key": "32138822", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191462713665, "ground_truth": 0}, {"key": "32138822", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920003570847, "ground_truth": 0}, {"key": "31070114", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6513548521707895, "ground_truth": 0}, {"key": "31070114", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5602526361493448, "ground_truth": 0}, {"key": "31070114", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.560252636138896, "ground_truth": 0}, {"key": "31070114", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552955060496147, "ground_truth": 0}, {"key": "31070114", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121998008764, "ground_truth": 0}, {"key": "39652762", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9394706123699366, "ground_truth": 0}, {"key": "39652762", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9437636521784534, "ground_truth": 0}, {"key": "39652762", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.955319133774926, "ground_truth": 0}, {"key": "39652762", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.860603627802553, "ground_truth": 0}, {"key": "39652762", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9079671436616151, "ground_truth": 0}, {"key": "33258866", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5907792017532035, "ground_truth": 0}, {"key": "33258866", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.605799063395154, "ground_truth": 0}, {"key": "33258866", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6352224370405702, "ground_truth": 0}, {"key": "33258866", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033664647218, "ground_truth": 0}, {"key": "33258866", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381469219219, "ground_truth": 0}, {"key": "36962388", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7534666501484689, "ground_truth": 0}, {"key": "36962388", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6548947271817418, "ground_truth": 0}, {"key": "36962388", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8140528048114557, "ground_truth": 0}, {"key": "36962388", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026741781033, "ground_truth": 0}, {"key": "36962388", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336802477713, "ground_truth": 0}, {"key": "32282272", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5794004256487828, "ground_truth": 0}, {"key": "32282272", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.41111085665756936, "ground_truth": 0}, {"key": "32282272", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7325918347500131, "ground_truth": 0}, {"key": "32282272", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4804787025927059, "ground_truth": 0}, {"key": "32282272", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881028047417, "ground_truth": 0}, {"key": "36093072", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9167080740852452, "ground_truth": 0}, {"key": "36093072", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8633916050988781, "ground_truth": 0}, {"key": "36093072", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9252299571808864, "ground_truth": 0}, {"key": "36093072", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105515080522, "ground_truth": 0}, {"key": "36093072", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.902609602517581, "ground_truth": 0}, {"key": "38879972", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7401743702314633, "ground_truth": 0}, {"key": "38879972", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8688267763564433, "ground_truth": 0}, {"key": "38879972", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7718435039712788, "ground_truth": 0}, {"key": "38879972", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681124056504, "ground_truth": 0}, {"key": "38879972", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063623012047, "ground_truth": 0}, {"key": "32106473", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6187804183940798, "ground_truth": 0}, {"key": "32106473", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7217432140698928, "ground_truth": 0}, {"key": "32106473", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7662936452945996, "ground_truth": 0}, {"key": "32106473", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.732591849795788, "ground_truth": 0}, {"key": "32106473", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321850775631, "ground_truth": 0}, {"key": "40415815", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6909762735973923, "ground_truth": 0}, {"key": "40415815", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6671476472187824, "ground_truth": 0}, {"key": "40415815", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.567936602647344, "ground_truth": 0}, {"key": "40415815", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494529711748, "ground_truth": 0}, {"key": "40415815", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008948194405314, "ground_truth": 0}, {"key": "34581918", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7563575539001439, "ground_truth": 0}, {"key": "34581918", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7090191639034651, "ground_truth": 0}, {"key": "34581918", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5832033577806313, "ground_truth": 0}, {"key": "34581918", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336861780846, "ground_truth": 0}, {"key": "34581918", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909763015406503, "ground_truth": 0}, {"key": "33004157", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9142907239370238, "ground_truth": 0}, {"key": "33004157", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8652240881075973, "ground_truth": 0}, {"key": "33004157", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8757869959607418, "ground_truth": 0}, {"key": "33004157", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333246059018203, "ground_truth": 0}, {"key": "33004157", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110409563643, "ground_truth": 0}, {"key": "30334943", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9339146191928246, "ground_truth": 0}, {"key": "30334943", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9252299613722449, "ground_truth": 0}, {"key": "30334943", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9046505313553983, "ground_truth": 0}, {"key": "30334943", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346116580362, "ground_truth": 0}, {"key": "30334943", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9207896697490404, "ground_truth": 0}, {"key": "33280503", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8080672174795934, "ground_truth": 0}, {"key": "33280503", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8661325199084033, "ground_truth": 0}, {"key": "33280503", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358378927811, "ground_truth": 0}, {"key": "33280503", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423183398329, "ground_truth": 0}, {"key": "33280503", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063684817899, "ground_truth": 0}, {"key": "25726782", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8255897183618437, "ground_truth": 0}, {"key": "25726782", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8187368058156522, "ground_truth": 0}, {"key": "25726782", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8816148993024588, "ground_truth": 0}, {"key": "25726782", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9385759615220247, "ground_truth": 0}, {"key": "25726782", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.896975575522972, "ground_truth": 0}, {"key": "35479854", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7264255841667248, "ground_truth": 0}, {"key": "35479854", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.752012585275136, "ground_truth": 0}, {"key": "35479854", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8104788984843048, "ground_truth": 0}, {"key": "35479854", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799928865437782, "ground_truth": 0}, {"key": "35479854", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.687629995030721, "ground_truth": 0}, {"key": "32716226", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6442251021361913, "ground_truth": 0}, {"key": "32716226", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.600188379236598, "ground_truth": 0}, {"key": "32716226", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6477982159274435, "ground_truth": 0}, {"key": "32716226", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089219556603, "ground_truth": 0}, {"key": "32716226", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435170241946, "ground_truth": 0}, {"key": "37047554", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8879840423076084, "ground_truth": 0}, {"key": "37047554", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7853085828756434, "ground_truth": 0}, {"key": "37047554", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253613056662, "ground_truth": 0}, {"key": "37047554", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878376705099, "ground_truth": 0}, {"key": "37047554", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506754172334, "ground_truth": 0}, {"key": "36565290", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7505527594179393, "ground_truth": 0}, {"key": "36565290", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6959583051739577, "ground_truth": 0}, {"key": "36565290", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8322366507888341, "ground_truth": 0}, {"key": "36565290", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437735591947, "ground_truth": 0}, {"key": "36565290", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306236645312, "ground_truth": 0}, {"key": "27758640", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6808786259983278, "ground_truth": 0}, {"key": "27758640", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7201715137437756, "ground_truth": 0}, {"key": "27758640", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7772998588375634, "ground_truth": 0}, {"key": "27758640", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303033220498, "ground_truth": 0}, {"key": "27758640", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743766020147, "ground_truth": 0}, {"key": "28897118", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8333245937167223, "ground_truth": 0}, {"key": "28897118", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7490871967738691, "ground_truth": 0}, {"key": "28897118", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8449215310526932, "ground_truth": 0}, {"key": "28897118", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624956937472, "ground_truth": 0}, {"key": "28897118", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.819893340228963, "ground_truth": 0}, {"key": "38452661", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.918480237739751, "ground_truth": 0}, {"key": "38452661", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511356445754, "ground_truth": 0}, {"key": "38452661", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8210441197522075, "ground_truth": 0}, {"key": "38452661", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358314061016, "ground_truth": 0}, {"key": "38452661", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388147352585, "ground_truth": 0}, {"key": "38033492", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.613236559678499, "ground_truth": 0}, {"key": "38033492", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7122321871373855, "ground_truth": 0}, {"key": "38033492", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5486735010845449, "ground_truth": 0}, {"key": "38033492", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786275770428, "ground_truth": 0}, {"key": "38033492", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504806059897, "ground_truth": 0}, {"key": "35949555", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9309620695193978, "ground_truth": 0}, {"key": "35949555", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9549844713167378, "ground_truth": 0}, {"key": "35949555", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9394706077475312, "ground_truth": 0}, {"key": "35949555", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9615338104576702, "ground_truth": 0}, {"key": "35949555", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9591542810528855, "ground_truth": 0}, {"key": "15263826", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7476159745780642, "ground_truth": 0}, {"key": "15263826", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8438951056383999, "ground_truth": 0}, {"key": "15263826", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9092645163561676, "ground_truth": 0}, {"key": "15263826", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.88720460391841, "ground_truth": 0}, {"key": "15263826", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748601010455, "ground_truth": 0}, {"key": "37313866", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8376199454921344, "ground_truth": 0}, {"key": "37313866", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6039318028241294, "ground_truth": 0}, {"key": "37313866", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6495786022279351, "ground_truth": 0}, {"key": "37313866", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185944012374239, "ground_truth": 0}, {"key": "37313866", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191133442829, "ground_truth": 0}, {"key": "13911157", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8558511502594481, "ground_truth": 0}, {"key": "13911157", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9257686275849075, "ground_truth": 0}, {"key": "13911157", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8333245901765146, "ground_truth": 0}, {"key": "13911157", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104625329833, "ground_truth": 0}, {"key": "13911157", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9130583507094039, "ground_truth": 0}, {"key": "39594894", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6740505056167236, "ground_truth": 0}, {"key": "39594894", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7008948213202655, "ground_truth": 0}, {"key": "39594894", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5292633979906359, "ground_truth": 0}, {"key": "39594894", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786106360613, "ground_truth": 0}, {"key": "39594894", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689458674836, "ground_truth": 0}, {"key": "34096170", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8187367961140124, "ground_truth": 0}, {"key": "34096170", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.78266247823044, "ground_truth": 0}, {"key": "34096170", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8679338316815837, "ground_truth": 0}, {"key": "34096170", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031738165399447, "ground_truth": 0}, {"key": "34096170", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786492996587944, "ground_truth": 0}, {"key": "37891952", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9697854108206123, "ground_truth": 0}, {"key": "37891952", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9481545346662068, "ground_truth": 0}, {"key": "37891952", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.970013490110367, "ground_truth": 0}, {"key": "37891952", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9612438072361443, "ground_truth": 0}, {"key": "37891952", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9385759572596253, "ground_truth": 0}, {"key": "40186158", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8365545564183478, "ground_truth": 0}, {"key": "40186158", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6943026534174038, "ground_truth": 0}, {"key": "40186158", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631400798895, "ground_truth": 0}, {"key": "40186158", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743686455614, "ground_truth": 0}, {"key": "40186158", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833689422371, "ground_truth": 0}, {"key": "37049719", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7879311947951293, "ground_truth": 0}, {"key": "37049719", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.699254420566707, "ground_truth": 0}, {"key": "37049719", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8879840379453096, "ground_truth": 0}, {"key": "37049719", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122966419149, "ground_truth": 0}, {"key": "37049719", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711573779316, "ground_truth": 0}, {"key": "34610504", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9425067186895405, "ground_truth": 0}, {"key": "34610504", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9053222876052943, "ground_truth": 0}, {"key": "34610504", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9284088019717531, "ground_truth": 0}, {"key": "34610504", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9053222923790865, "ground_truth": 0}, {"key": "34610504", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9504109750268722, "ground_truth": 0}, {"key": "37595429", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8962513689869176, "ground_truth": 0}, {"key": "37595429", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8548846413283551, "ground_truth": 0}, {"key": "37595429", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8940517126616356, "ground_truth": 0}, {"key": "37595429", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942178961254, "ground_truth": 0}, {"key": "37595429", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.905989823438292, "ground_truth": 0}, {"key": "29772670", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8438950974983364, "ground_truth": 0}, {"key": "29772670", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8354835406786499, "ground_truth": 0}, {"key": "29772670", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8198933346032086, "ground_truth": 0}, {"key": "29772670", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916009034156, "ground_truth": 0}, {"key": "29772670", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210440935522222, "ground_truth": 0}, {"key": "36369872", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8322366573426494, "ground_truth": 0}, {"key": "36369872", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5621765000189001, "ground_truth": 0}, {"key": "36369872", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6808786120074758, "ground_truth": 0}, {"key": "36369872", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646066992243, "ground_truth": 0}, {"key": "36369872", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085737172338, "ground_truth": 0}, {"key": "34527433", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5698526632401394, "ground_truth": 0}, {"key": "34527433", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.540923875929986, "ground_truth": 0}, {"key": "34527433", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.4016877982067012, "ground_truth": 0}, {"key": "34527433", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784100577523, "ground_truth": 0}, {"key": "34527433", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167812879029, "ground_truth": 0}, {"key": "31111734", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8832359939358371, "ground_truth": 0}, {"key": "31111734", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8198933360728426, "ground_truth": 0}, {"key": "31111734", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8969755740284279, "ground_truth": 0}, {"key": "31111734", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835278707791, "ground_truth": 0}, {"key": "31111734", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578440417995, "ground_truth": 0}, {"key": "40303872", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7704647875171531, "ground_truth": 0}, {"key": "40303872", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7662936303801902, "ground_truth": 0}, {"key": "40303872", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6893056485245826, "ground_truth": 0}, {"key": "40303872", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936522100579, "ground_truth": 0}, {"key": "40303872", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187368103695477, "ground_truth": 0}, {"key": "33653553", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7325918343048112, "ground_truth": 0}, {"key": "33653553", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8233284012697629, "ground_truth": 0}, {"key": "33653553", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6909762977974281, "ground_truth": 0}, {"key": "33653553", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191234862173, "ground_truth": 0}, {"key": "33653553", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.781330629226784, "ground_truth": 0}, {"key": "34404510", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7943849562598329, "ground_truth": 0}, {"key": "34404510", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8044059417710883, "ground_truth": 0}, {"key": "34404510", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7416740064763061, "ground_truth": 0}, {"key": "34404510", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215346824183, "ground_truth": 0}, {"key": "34404510", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723819201896, "ground_truth": 0}, {"key": "35568692", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6688802528977872, "ground_truth": 0}, {"key": "35568692", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6224593515267233, "ground_truth": 0}, {"key": "35568692", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5448014026624012, "ground_truth": 0}, {"key": "35568692", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241653782639, "ground_truth": 0}, {"key": "35568692", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191248159574, "ground_truth": 0}, {"key": "39151664", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6334102453464362, "ground_truth": 0}, {"key": "39151664", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7446563333503028, "ground_truth": 0}, {"key": "39151664", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.702530063396483, "ground_truth": 0}, {"key": "39151664", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892337083308177, "ground_truth": 0}, {"key": "39151664", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056089042927, "ground_truth": 0}, {"key": "37493670", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9929335993338114, "ground_truth": 0}, {"key": "37493670", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9930423913862676, "ground_truth": 0}, {"key": "37493670", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.990366347300694, "ground_truth": 0}, {"key": "37493670", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9940428455822581, "ground_truth": 0}, {"key": "37493670", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9919380079612223, "ground_truth": 0}, {"key": "21935983", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6992544095641304, "ground_truth": 0}, {"key": "21935983", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6531269074442005, "ground_truth": 0}, {"key": "21935983", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6976089030543793, "ground_truth": 0}, {"key": "21935983", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.766293642496568, "ground_truth": 0}, {"key": "21935983", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416219661845, "ground_truth": 0}, {"key": "38174214", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8509647056489239, "ground_truth": 0}, {"key": "38174214", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8887588071038417, "ground_truth": 0}, {"key": "38174214", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9105454088401652, "ground_truth": 0}, {"key": "38174214", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757870017824789, "ground_truth": 0}, {"key": "38174214", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.871474869652751, "ground_truth": 0}, {"key": "40319923", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9257686318979801, "ground_truth": 0}, {"key": "40319923", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9507778887303908, "ground_truth": 0}, {"key": "40319923", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8955226720023116, "ground_truth": 0}, {"key": "40319923", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9066531140969144, "ground_truth": 0}, {"key": "40319923", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907083172191, "ground_truth": 0}, {"key": "36478264", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7690802401039178, "ground_truth": 0}, {"key": "36478264", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8333245995235079, "ground_truth": 0}, {"key": "36478264", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8749346202393304, "ground_truth": 0}, {"key": "36478264", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897379635395, "ground_truth": 0}, {"key": "36478264", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956581188577092, "ground_truth": 0}, {"key": "11935769", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5563995724032411, "ground_truth": 0}, {"key": "11935769", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7577943665647797, "ground_truth": 0}, {"key": "11935769", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7138307680589175, "ground_truth": 0}, {"key": "11935769", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195212791726, "ground_truth": 0}, {"key": "11935769", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583163624741, "ground_truth": 0}, {"key": "33373410", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.616935821058153, "ground_truth": 0}, {"key": "33373410", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7279754348235987, "ground_truth": 0}, {"key": "33373410", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.690976298890516, "ground_truth": 0}, {"key": "33373410", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434924022127, "ground_truth": 0}, {"key": "33373410", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321825726811, "ground_truth": 0}, {"key": "11130680", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8679338380827794, "ground_truth": 0}, {"key": "11130680", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8080672224507178, "ground_truth": 0}, {"key": "11130680", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5832033507091418, "ground_truth": 0}, {"key": "11130680", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755664931452, "ground_truth": 0}, {"key": "11130680", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059282369023, "ground_truth": 0}, {"key": "34868650", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6926419879050774, "ground_truth": 0}, {"key": "34868650", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.690976290237154, "ground_truth": 0}, {"key": "34868650", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7057850296557715, "ground_truth": 0}, {"key": "34868650", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702895362108, "ground_truth": 0}, {"key": "34868650", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118708879557, "ground_truth": 0}, {"key": "33960561", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8044059252170592, "ground_truth": 0}, {"key": "33960561", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6688802616953745, "ground_truth": 0}, {"key": "33960561", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7008948150992045, "ground_truth": 0}, {"key": "33960561", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240745662709, "ground_truth": 0}, {"key": "33960561", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239815565137, "ground_truth": 0}, {"key": "22504858", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8732148386804719, "ground_truth": 0}, {"key": "22504858", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8925625244413178, "ground_truth": 0}, {"key": "22504858", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9329437178662374, "ground_truth": 0}, {"key": "22504858", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9105454009443821, "ground_truth": 0}, {"key": "22504858", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942317841273, "ground_truth": 0}, {"key": "32283530", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7690802383543934, "ground_truth": 0}, {"key": "32283530", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.694302655837431, "ground_truth": 0}, {"key": "32283530", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8386797660312545, "ground_truth": 0}, {"key": "32283530", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677542494986, "ground_truth": 0}, {"key": "32283530", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416495621994, "ground_truth": 0}, {"key": "38377099", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7943849760845559, "ground_truth": 0}, {"key": "38377099", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7866228154739188, "ground_truth": 0}, {"key": "38377099", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8056321781274761, "ground_truth": 0}, {"key": "38377099", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898675649482, "ground_truth": 0}, {"key": "38377099", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145842140889, "ground_truth": 0}, {"key": "36105123", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.895522666252668, "ground_truth": 0}, {"key": "36105123", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.951863231503957, "ground_truth": 0}, {"key": "36105123", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9433475763752849, "ground_truth": 0}, {"key": "36105123", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9445872024175946, "ground_truth": 0}, {"key": "36105123", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9403530606305088, "ground_truth": 0}, {"key": "33527826", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8300437609982972, "ground_truth": 0}, {"key": "33527826", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7341195302560456, "ground_truth": 0}, {"key": "33527826", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8386797610055884, "ground_truth": 0}, {"key": "33527826", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197876941234, "ground_truth": 0}, {"key": "33527826", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528135397076, "ground_truth": 0}, {"key": "32349891", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8519528039222604, "ground_truth": 0}, {"key": "32349891", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8397339656753952, "ground_truth": 0}, {"key": "32349891", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8697145867440187, "ground_truth": 0}, {"key": "32349891", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.856812293735624, "ground_truth": 0}, {"key": "32349891", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215330482541, "ground_truth": 0}, {"key": "34281974", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6370308153358822, "ground_truth": 0}, {"key": "34281974", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6477982081144138, "ground_truth": 0}, {"key": "34281974", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5312093428648873, "ground_truth": 0}, {"key": "34281974", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679365766060057, "ground_truth": 0}, {"key": "34281974", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926666042957952, "ground_truth": 0}, {"key": "29387866", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7956581247345845, "ground_truth": 0}, {"key": "29387866", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6169358280311775, "ground_truth": 0}, {"key": "29387866", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8198933288982705, "ground_truth": 0}, {"key": "29387866", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.771843496910198, "ground_truth": 0}, {"key": "29387866", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.649578613587656, "ground_truth": 0}, {"key": "35731925", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9911526454865123, "ground_truth": 0}, {"key": "35731925", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9971104189359119, "ground_truth": 0}, {"key": "35731925", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9873750512107716, "ground_truth": 0}, {"key": "35731925", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9929335993021842, "ground_truth": 0}, {"key": "35731925", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.989671847433208, "ground_truth": 0}, {"key": "38829733", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8407825991019403, "ground_truth": 0}, {"key": "38829733", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8568122995507875, "ground_truth": 0}, {"key": "38829733", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253833594664, "ground_truth": 0}, {"key": "38829733", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869949267784, "ground_truth": 0}, {"key": "38829733", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441059063702, "ground_truth": 0}, {"key": "24624736", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8529354706245731, "ground_truth": 0}, {"key": "24624736", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8643104696432483, "ground_truth": 0}, {"key": "24624736", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9273632938437323, "ground_truth": 0}, {"key": "24624736", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267741043513, "ground_truth": 0}, {"key": "24624736", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511614107702, "ground_truth": 0}, {"key": "36928562", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9933588877299466, "ground_truth": 0}, {"key": "36928562", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9914886968657043, "ground_truth": 0}, {"key": "36928562", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9931495202838224, "ground_truth": 0}, {"key": "36928562", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9907319869530571, "ground_truth": 0}, {"key": "36928562", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9934102286410945, "ground_truth": 0}, {"key": "34941119", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6740504866045562, "ground_truth": 0}, {"key": "34941119", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6020615794544149, "ground_truth": 0}, {"key": "34941119", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6601723903081614, "ground_truth": 0}, {"key": "34941119", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159689554401, "ground_truth": 0}, {"key": "34941119", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640350906337, "ground_truth": 0}, {"key": "30206231", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7520125566408231, "ground_truth": 0}, {"key": "30206231", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7520125657625873, "ground_truth": 0}, {"key": "30206231", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.717011873687711, "ground_truth": 0}, {"key": "30206231", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757870057467415, "ground_truth": 0}, {"key": "30206231", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884546691165, "ground_truth": 0}, {"key": "35584972", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7592254038105358, "ground_truth": 0}, {"key": "35584972", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7772998495621543, "ground_truth": 0}, {"key": "35584972", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7534666513464112, "ground_truth": 0}, {"key": "35584972", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675306212234, "ground_truth": 0}, {"key": "35584972", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148364827373, "ground_truth": 0}, {"key": "39277709", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8615381994297229, "ground_truth": 0}, {"key": "39277709", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8856314651523955, "ground_truth": 0}, {"key": "39277709", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8824278565643752, "ground_truth": 0}, {"key": "39277709", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850286775151, "ground_truth": 0}, {"key": "39277709", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8661325194522425, "ground_truth": 0}, {"key": "36123657", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8872045969232154, "ground_truth": 0}, {"key": "36123657", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8940517083225189, "ground_truth": 0}, {"key": "36123657", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9289263339984093, "ground_truth": 0}, {"key": "36123657", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377699648418, "ground_truth": 0}, {"key": "36123657", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.882427858685526, "ground_truth": 0}, {"key": "33363938", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8832359794983237, "ground_truth": 0}, {"key": "33363938", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6842640255033261, "ground_truth": 0}, {"key": "33363938", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.866132516624813, "ground_truth": 0}, {"key": "33363938", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9314625106179045, "ground_truth": 0}, {"key": "33363938", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122138119725, "ground_truth": 0}, {"key": "37349129", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.828938822193074, "ground_truth": 0}, {"key": "37349129", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511501535943, "ground_truth": 0}, {"key": "37349129", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8766343887884626, "ground_truth": 0}, {"key": "37349129", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849744164609, "ground_truth": 0}, {"key": "37349129", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.850964699433691, "ground_truth": 0}, {"key": "37160199", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6654105740798317, "ground_truth": 0}, {"key": "37160199", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.704160133490394, "ground_truth": 0}, {"key": "37160199", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253721673003, "ground_truth": 0}, {"key": "37160199", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254179267199, "ground_truth": 0}, {"key": "37160199", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.769080228936833, "ground_truth": 0}, {"key": "35891053", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9362850026035047, "ground_truth": 0}, {"key": "35891053", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8962513743340732, "ground_truth": 0}, {"key": "35891053", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9496693707282712, "ground_truth": 0}, {"key": "35891053", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797037803863, "ground_truth": 0}, {"key": "35891053", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9105453948194596, "ground_truth": 0}, {"key": "40694542", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.49023560446930214, "ground_truth": 0}, {"key": "40694542", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4513264974300536, "ground_truth": 0}, {"key": "40694542", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6206215918093402, "ground_truth": 0}, {"key": "40694542", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241490745025, "ground_truth": 0}, {"key": "40694542", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984786799336, "ground_truth": 0}, {"key": "24645770", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.72174319660892, "ground_truth": 0}, {"key": "24645770", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7185944122438129, "ground_truth": 0}, {"key": "24645770", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7892337122391905, "ground_truth": 0}, {"key": "24645770", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493160432651, "ground_truth": 0}, {"key": "24645770", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197796048433, "ground_truth": 0}, {"key": "37974587", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.90122741187546, "ground_truth": 0}, {"key": "37974587", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8864204034302271, "ground_truth": 0}, {"key": "37974587", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8688267847868305, "ground_truth": 0}, {"key": "37974587", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711711682268, "ground_truth": 0}, {"key": "37974587", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797748724062, "ground_truth": 0}, {"key": "40354149", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8407825800353215, "ground_truth": 0}, {"key": "40354149", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.915507240875979, "ground_truth": 0}, {"key": "40354149", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9118099489800864, "ground_truth": 0}, {"key": "40354149", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578509631068, "ground_truth": 0}, {"key": "40354149", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748560953083, "ground_truth": 0}, {"key": "35519470", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5292634032350081, "ground_truth": 0}, {"key": "35519470", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5078118704100714, "ground_truth": 0}, {"key": "35519470", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.3468730663958516, "ground_truth": 0}, {"key": "35519470", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544705034340195, "ground_truth": 0}, {"key": "35519470", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643962637995, "ground_truth": 0}, {"key": "36185624", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.787931209139913, "ground_truth": 0}, {"key": "36185624", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.831143050642809, "ground_truth": 0}, {"key": "36185624", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8879840462968847, "ground_truth": 0}, {"key": "36185624", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306404552572, "ground_truth": 0}, {"key": "36185624", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943685444268, "ground_truth": 0}, {"key": "39306113", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6706082555927771, "ground_truth": 0}, {"key": "39306113", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6113819692772547, "ground_truth": 0}, {"key": "39306113", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8068526306188142, "ground_truth": 0}, {"key": "39306113", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307884031704, "ground_truth": 0}, {"key": "39306113", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241882252069, "ground_truth": 0}, {"key": "19347718", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6001883749036058, "ground_truth": 0}, {"key": "19347718", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5679366279460581, "ground_truth": 0}, {"key": "19347718", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6334102730485107, "ground_truth": 0}, {"key": "19347718", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253796342192, "ground_truth": 0}, {"key": "19347718", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740044477179, "ground_truth": 0}, {"key": "21870064", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6601723706639956, "ground_truth": 0}, {"key": "21870064", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5907791982461689, "ground_truth": 0}, {"key": "21870064", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5409238830529263, "ground_truth": 0}, {"key": "21870064", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365969301259, "ground_truth": 0}, {"key": "21870064", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089341671483, "ground_truth": 0}, {"key": "37675776", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9425067299301297, "ground_truth": 0}, {"key": "37675776", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9485372369593219, "ground_truth": 0}, {"key": "37675776", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9390248206959848, "ground_truth": 0}, {"key": "37675776", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9469902274960353, "ground_truth": 0}, {"key": "37675776", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9304582587914341, "ground_truth": 0}, {"key": "38107017", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6406358408119083, "ground_truth": 0}, {"key": "38107017", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7264256275862909, "ground_truth": 0}, {"key": "38107017", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7201715019550443, "ground_truth": 0}, {"key": "38107017", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238476982183, "ground_truth": 0}, {"key": "38107017", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416561699156, "ground_truth": 0}, {"key": "40046472", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6001883629770446, "ground_truth": 0}, {"key": "40046472", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6113819641955776, "ground_truth": 0}, {"key": "40046472", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5945512350186158, "ground_truth": 0}, {"key": "40046472", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646055466631, "ground_truth": 0}, {"key": "40046472", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.43782349964240946, "ground_truth": 0}, {"key": "32157820", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8255897372030083, "ground_truth": 0}, {"key": "32157820", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8469578469700249, "ground_truth": 0}, {"key": "32157820", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7264256047127782, "ground_truth": 0}, {"key": "32157820", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837831253904, "ground_truth": 0}, {"key": "32157820", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253497835691, "ground_truth": 0}, {"key": "41004037", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7295198030427669, "ground_truth": 0}, {"key": "41004037", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7772998566179776, "ground_truth": 0}, {"key": "41004037", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7041601526201373, "ground_truth": 0}, {"key": "41004037", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140528025766675, "ground_truth": 0}, {"key": "41004037", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849534323733, "ground_truth": 0}, {"key": "21387993", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7310585732093634, "ground_truth": 0}, {"key": "21387993", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8006920078401145, "ground_truth": 0}, {"key": "21387993", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358216687857, "ground_truth": 0}, {"key": "21387993", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432021902592, "ground_truth": 0}, {"key": "21387993", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789174798105, "ground_truth": 0}, {"key": "34665539", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6992544310381269, "ground_truth": 0}, {"key": "34665539", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7295198049843914, "ground_truth": 0}, {"key": "34665539", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6370307811112096, "ground_truth": 0}, {"key": "34665539", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920151231018, "ground_truth": 0}, {"key": "34665539", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998606447706, "ground_truth": 0}, {"key": "37872111", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6825737050158087, "ground_truth": 0}, {"key": "37872111", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6566583036542271, "ground_truth": 0}, {"key": "37872111", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7866228228897174, "ground_truth": 0}, {"key": "37872111", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4804786717288886, "ground_truth": 0}, {"key": "37872111", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321781593139, "ground_truth": 0}, {"key": "36629542", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8489721999212696, "ground_truth": 0}, {"key": "36629542", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7732163861208671, "ground_truth": 0}, {"key": "36629542", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8407825925946468, "ground_truth": 0}, {"key": "36629542", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493182242252, "ground_truth": 0}, {"key": "36629542", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526262652808, "ground_truth": 0}, {"key": "36487527", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8749346287694866, "ground_truth": 0}, {"key": "36487527", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7074047043662745, "ground_truth": 0}, {"key": "36487527", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9046505385868849, "ground_truth": 0}, {"key": "36487527", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8925625200584899, "ground_truth": 0}, {"key": "36487527", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549519537424, "ground_truth": 0}, {"key": "37344756", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9433475766138989, "ground_truth": 0}, {"key": "37344756", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8615382035938928, "ground_truth": 0}, {"key": "37344756", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9299510347344603, "ground_truth": 0}, {"key": "37344756", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256488529445, "ground_truth": 0}, {"key": "37344756", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9676556675387459, "ground_truth": 0}, {"key": "38707722", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6876300123386616, "ground_truth": 0}, {"key": "38707722", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7279754406392366, "ground_truth": 0}, {"key": "38707722", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.692641978714026, "ground_truth": 0}, {"key": "38707722", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786204944018, "ground_truth": 0}, {"key": "38707722", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.73259184049887, "ground_truth": 0}, {"key": "37093419", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6297745829643232, "ground_truth": 0}, {"key": "37093419", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.35398630087816363, "ground_truth": 0}, {"key": "37093419", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6224593270455234, "ground_truth": 0}, {"key": "37093419", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307914660692, "ground_truth": 0}, {"key": "37093419", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089174023079, "ground_truth": 0}, {"key": "35547391", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.832236656312586, "ground_truth": 0}, {"key": "35547391", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7918210734458454, "ground_truth": 0}, {"key": "35547391", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6076632093571726, "ground_truth": 0}, {"key": "35547391", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253729012097, "ground_truth": 0}, {"key": "35547391", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.763483753192091, "ground_truth": 0}, {"key": "37173168", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8418256512744957, "ground_truth": 0}, {"key": "37173168", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.810478908092521, "ground_truth": 0}, {"key": "37173168", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059331760105, "ground_truth": 0}, {"key": "37173168", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711736057228, "ground_truth": 0}, {"key": "37173168", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.880797074541988, "ground_truth": 0}, {"key": "30725298", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7634837742326268, "ground_truth": 0}, {"key": "30725298", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7592254306904039, "ground_truth": 0}, {"key": "30725298", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7606506495925738, "ground_truth": 0}, {"key": "30725298", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118990417417, "ground_truth": 0}, {"key": "30725298", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311915470295, "ground_truth": 0}, {"key": "33830573", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9130583508322112, "ground_truth": 0}, {"key": "33830573", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8606036235140289, "ground_truth": 0}, {"key": "33830573", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9241418235303726, "ground_truth": 0}, {"key": "33830573", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145767506164, "ground_truth": 0}, {"key": "33830573", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759879393588, "ground_truth": 0}, {"key": "33415474", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5486735035316261, "ground_truth": 0}, {"key": "33415474", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5078118796346778, "ground_truth": 0}, {"key": "33415474", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5409238713150215, "ground_truth": 0}, {"key": "33415474", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684695873063, "ground_truth": 0}, {"key": "33415474", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241708050344, "ground_truth": 0}, {"key": "37383994", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8879840454674222, "ground_truth": 0}, {"key": "37383994", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9257686324894049, "ground_truth": 0}, {"key": "37383994", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9252299636622527, "ground_truth": 0}, {"key": "37383994", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9372107908643166, "ground_truth": 0}, {"key": "37383994", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9556514239380375, "ground_truth": 0}, {"key": "38576819", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8633915961589994, "ground_truth": 0}, {"key": "38576819", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8933094052427247, "ground_truth": 0}, {"key": "38576819", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9329437174321205, "ground_truth": 0}, {"key": "38576819", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9173026601801201, "ground_truth": 0}, {"key": "38576819", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666594663354, "ground_truth": 0}, {"key": "34500226", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7745833723206158, "ground_truth": 0}, {"key": "34500226", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624778647243, "ground_truth": 0}, {"key": "34500226", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7648916148317377, "ground_truth": 0}, {"key": "34500226", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718435008805788, "ground_truth": 0}, {"key": "34500226", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.852935472144927, "ground_truth": 0}, {"key": "39856394", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7620700956762774, "ground_truth": 0}, {"key": "39856394", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7606506566741251, "ground_truth": 0}, {"key": "39856394", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7138307599415503, "ground_truth": 0}, {"key": "39856394", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.750552774244343, "ground_truth": 0}, {"key": "39856394", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089292762966, "ground_truth": 0}, {"key": "35499522", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5755880143729327, "ground_truth": 0}, {"key": "35499522", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6636689587597026, "ground_truth": 0}, {"key": "35499522", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6808785969158859, "ground_truth": 0}, {"key": "35499522", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191261528369, "ground_truth": 0}, {"key": "35499522", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872021445516, "ground_truth": 0}, {"key": "30157766", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835318039858, "ground_truth": 0}, {"key": "30157766", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8539127557920558, "ground_truth": 0}, {"key": "30157766", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8092759833133677, "ground_truth": 0}, {"key": "30157766", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338296032808, "ground_truth": 0}, {"key": "30157766", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278619026733, "ground_truth": 0}, {"key": "40472346", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8606036346010822, "ground_truth": 0}, {"key": "40472346", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7918210612783695, "ground_truth": 0}, {"key": "40472346", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8221891207335772, "ground_truth": 0}, {"key": "40472346", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647978568046, "ground_truth": 0}, {"key": "40472346", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306306039415, "ground_truth": 0}, {"key": "35305635", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8233284045687136, "ground_truth": 0}, {"key": "35305635", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8221891539701703, "ground_truth": 0}, {"key": "35305635", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9005297861461171, "ground_truth": 0}, {"key": "35305635", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743701826478, "ground_truth": 0}, {"key": "35305635", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.858718588844867, "ground_truth": 0}, {"key": "32495926", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7786493167264993, "ground_truth": 0}, {"key": "32495926", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.677474005914408, "ground_truth": 0}, {"key": "32495926", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8140527946852346, "ground_truth": 0}, {"key": "32495926", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068887817911, "ground_truth": 0}, {"key": "32495926", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.769080250516329, "ground_truth": 0}, {"key": "37353801", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7648916260570158, "ground_truth": 0}, {"key": "37353801", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6636689609715294, "ground_truth": 0}, {"key": "37353801", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7690802347057232, "ground_truth": 0}, {"key": "37353801", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094697751365, "ground_truth": 0}, {"key": "37353801", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434888976071, "ground_truth": 0}, {"key": "30159904", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7745833816120653, "ground_truth": 0}, {"key": "30159904", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7057850211947133, "ground_truth": 0}, {"key": "30159904", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7217432315050624, "ground_truth": 0}, {"key": "30159904", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.799442338485302, "ground_truth": 0}, {"key": "30159904", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.817574482690836, "ground_truth": 0}, {"key": "33698679", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6926419770589052, "ground_truth": 0}, {"key": "33698679", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6531269360478403, "ground_truth": 0}, {"key": "33698679", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6757646184238681, "ground_truth": 0}, {"key": "33698679", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802292169633, "ground_truth": 0}, {"key": "33698679", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916097309277, "ground_truth": 0}, {"key": "40530172", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9079671373702322, "ground_truth": 0}, {"key": "40530172", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8519528080585652, "ground_truth": 0}, {"key": "40530172", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9032942159388332, "ground_truth": 0}, {"key": "40530172", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063807752051, "ground_truth": 0}, {"key": "40530172", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942338454762, "ground_truth": 0}, {"key": "40652941", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.835483538426085, "ground_truth": 0}, {"key": "40652941", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.821044102693122, "ground_truth": 0}, {"key": "40652941", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8832359904807776, "ground_truth": 0}, {"key": "40652941", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998547233383, "ground_truth": 0}, {"key": "40652941", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797411585112, "ground_truth": 0}, {"key": "40122246", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8606036242283717, "ground_truth": 0}, {"key": "40122246", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7371581687224849, "ground_truth": 0}, {"key": "40122246", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8354835428040823, "ground_truth": 0}, {"key": "40122246", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891319384972, "ground_truth": 0}, {"key": "40122246", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715063949262, "ground_truth": 0}, {"key": "40032656", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8479677543911464, "ground_truth": 0}, {"key": "40032656", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8887587860560271, "ground_truth": 0}, {"key": "40032656", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8962513774515066, "ground_truth": 0}, {"key": "40032656", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377638209174, "ground_truth": 0}, {"key": "40032656", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675406881425, "ground_truth": 0}, {"key": "38913680", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6688802592560866, "ground_truth": 0}, {"key": "38913680", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6187804252505393, "ground_truth": 0}, {"key": "38913680", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6150878270688139, "ground_truth": 0}, {"key": "38913680", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419789618682, "ground_truth": 0}, {"key": "38913680", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.566018537067392, "ground_truth": 0}, {"key": "17608039", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6132365435162458, "ground_truth": 0}, {"key": "17608039", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6261241569075231, "ground_truth": 0}, {"key": "17608039", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5136684694224533, "ground_truth": 0}, {"key": "17608039", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.642432470828989, "ground_truth": 0}, {"key": "17608039", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218813774149467, "ground_truth": 0}, {"key": "40434901", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.799442313507019, "ground_truth": 0}, {"key": "40434901", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511543889765, "ground_truth": 0}, {"key": "40434901", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.845942444676822, "ground_truth": 0}, {"key": "40434901", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210821260454, "ground_truth": 0}, {"key": "40434901", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918318783438, "ground_truth": 0}, {"key": "37680058", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.40733340442730753, "ground_truth": 0}, {"key": "37680058", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.3923368667430371, "ground_truth": 0}, {"key": "37680058", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.43398148384103175, "ground_truth": 0}, {"key": "37680058", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937837582100764, "ground_truth": 0}, {"key": "37680058", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557748970626454, "ground_truth": 0}, {"key": "37291821", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6992544229083381, "ground_truth": 0}, {"key": "37291821", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6150878530158784, "ground_truth": 0}, {"key": "37291821", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5717665894950543, "ground_truth": 0}, {"key": "37291821", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601418614418, "ground_truth": 0}, {"key": "37291821", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512086584847, "ground_truth": 0}, {"key": "41002743", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8031738087645013, "ground_truth": 0}, {"key": "41002743", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8365545576349597, "ground_truth": 0}, {"key": "41002743", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8840392956880371, "ground_truth": 0}, {"key": "41002743", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354823046144, "ground_truth": 0}, {"key": "41002743", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8976952959759466, "ground_truth": 0}, {"key": "36322869", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9092645132711323, "ground_truth": 0}, {"key": "36322869", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9005297801164835, "ground_truth": 0}, {"key": "36322869", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358264543855, "ground_truth": 0}, {"key": "36322869", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511517140365, "ground_truth": 0}, {"key": "36322869", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210634381495, "ground_truth": 0}, {"key": "39459717", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9202179909327608, "ground_truth": 0}, {"key": "39459717", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8311430325563984, "ground_truth": 0}, {"key": "39459717", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8807970672809271, "ground_truth": 0}, {"key": "39459717", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9039745175743898, "ground_truth": 0}, {"key": "39459717", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772243936562, "ground_truth": 0}, {"key": "36503727", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6619228640457727, "ground_truth": 0}, {"key": "36503727", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.660172384014402, "ground_truth": 0}, {"key": "36503727", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5926666037691105, "ground_truth": 0}, {"key": "36503727", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.583203363665734, "ground_truth": 0}, {"key": "36503727", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526631109476, "ground_truth": 0}, {"key": "35682367", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7879311916954966, "ground_truth": 0}, {"key": "35682367", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7648916261945761, "ground_truth": 0}, {"key": "35682367", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6584174933576649, "ground_truth": 0}, {"key": "35682367", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047098629921, "ground_truth": 0}, {"key": "35682367", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666562458757, "ground_truth": 0}, {"key": "36472353", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7461389948403329, "ground_truth": 0}, {"key": "36472353", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7295197571477265, "ground_truth": 0}, {"key": "36472353", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7264255996012919, "ground_truth": 0}, {"key": "36472353", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849436514553, "ground_truth": 0}, {"key": "36472353", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307564257488, "ground_truth": 0}, {"key": "37651907", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.790530309138096, "ground_truth": 0}, {"key": "37651907", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5698526578507077, "ground_truth": 0}, {"key": "37651907", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7279754234678423, "ground_truth": 0}, {"key": "37651907", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.754915004833792, "ground_truth": 0}, {"key": "37651907", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563318112497, "ground_truth": 0}, {"key": "36255476", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7122321755926826, "ground_truth": 0}, {"key": "36255476", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6859494586779554, "ground_truth": 0}, {"key": "36255476", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7943849687079829, "ground_truth": 0}, {"key": "36255476", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117785748834, "ground_truth": 0}, {"key": "36255476", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210766533798, "ground_truth": 0}, {"key": "37283518", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8955226776180363, "ground_truth": 0}, {"key": "37283518", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9268352737161858, "ground_truth": 0}, {"key": "37283518", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8679338427604604, "ground_truth": 0}, {"key": "37283518", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185785423987, "ground_truth": 0}, {"key": "37283518", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9111797081168717, "ground_truth": 0}, {"key": "34906785", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7520125746736877, "ground_truth": 0}, {"key": "34906785", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8774767887713966, "ground_truth": 0}, {"key": "34906785", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7248702866410547, "ground_truth": 0}, {"key": "34906785", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.836554544266327, "ground_truth": 0}, {"key": "34906785", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.741674020384252, "ground_truth": 0}, {"key": "34965328", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8872045954395547, "ground_truth": 0}, {"key": "34965328", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9059898162908393, "ground_truth": 0}, {"key": "34965328", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8879840569830011, "ground_truth": 0}, {"key": "34965328", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199605476481, "ground_truth": 0}, {"key": "34965328", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8688267818705551, "ground_truth": 0}, {"key": "38788440", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.712232188494459, "ground_truth": 0}, {"key": "38788440", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.762070095642233, "ground_truth": 0}, {"key": "38788440", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7090191412531864, "ground_truth": 0}, {"key": "38788440", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300556340334, "ground_truth": 0}, {"key": "38788440", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983122143995208, "ground_truth": 0}, {"key": "35046866", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8688267605618866, "ground_truth": 0}, {"key": "35046866", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7799928878522191, "ground_truth": 0}, {"key": "35046866", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631528626502, "ground_truth": 0}, {"key": "35046866", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210628958846, "ground_truth": 0}, {"key": "35046866", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840415509327, "ground_truth": 0}, {"key": "37629558", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5525396851476794, "ground_truth": 0}, {"key": "37629558", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6388352804001297, "ground_truth": 0}, {"key": "37629558", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6460137032353654, "ground_truth": 0}, {"key": "37629558", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312094001318, "ground_truth": 0}, {"key": "37629558", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199074294046, "ground_truth": 0}, {"key": "33859914", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.800692017295519, "ground_truth": 0}, {"key": "33859914", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.812867313548281, "ground_truth": 0}, {"key": "33859914", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631590022466, "ground_truth": 0}, {"key": "33859914", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867872217777, "ground_truth": 0}, {"key": "33859914", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416419200741, "ground_truth": 0}, {"key": "39790523", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8887587972286365, "ground_truth": 0}, {"key": "39790523", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8044059195226058, "ground_truth": 0}, {"key": "39790523", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8539127662733521, "ground_truth": 0}, {"key": "39790523", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897262614514, "ground_truth": 0}, {"key": "39790523", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187368042967249, "ground_truth": 0}, {"key": "33509656", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5774953724388843, "ground_truth": 0}, {"key": "33509656", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7476159625812123, "ground_truth": 0}, {"key": "33509656", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8289388215420785, "ground_truth": 0}, {"key": "33509656", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233284176865573, "ground_truth": 0}, {"key": "33509656", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306406535709, "ground_truth": 0}, {"key": "17380923", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8397339563520971, "ground_truth": 0}, {"key": "17380923", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8879840469907894, "ground_truth": 0}, {"key": "17380923", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.892562525074214, "ground_truth": 0}, {"key": "17380923", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063816046062, "ground_truth": 0}, {"key": "17380923", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281678675681, "ground_truth": 0}, {"key": "36202526", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5774953976410463, "ground_truth": 0}, {"key": "36202526", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7490872105723952, "ground_truth": 0}, {"key": "36202526", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.720171488950003, "ground_truth": 0}, {"key": "36202526", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085710881177, "ground_truth": 0}, {"key": "36202526", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919889082912, "ground_truth": 0}, {"key": "26419232", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7431679913851088, "ground_truth": 0}, {"key": "26419232", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7634837800611262, "ground_truth": 0}, {"key": "26419232", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7122321805097038, "ground_truth": 0}, {"key": "26419232", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624746125396, "ground_truth": 0}, {"key": "26419232", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253673427401, "ground_truth": 0}, {"key": "34232398", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.738669082940562, "ground_truth": 0}, {"key": "34232398", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8969755647222941, "ground_truth": 0}, {"key": "34232398", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6842640355819333, "ground_truth": 0}, {"key": "34232398", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140528129666911, "ground_truth": 0}, {"key": "34232398", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754413483803, "ground_truth": 0}, {"key": "33586045", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8198933120674521, "ground_truth": 0}, {"key": "33586045", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7839884864757672, "ground_truth": 0}, {"key": "33586045", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7826624867831539, "ground_truth": 0}, {"key": "33586045", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416739975659553, "ground_truth": 0}, {"key": "33586045", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432165482661, "ground_truth": 0}, {"key": "32281151", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.72797544784181, "ground_truth": 0}, {"key": "32281151", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7786493162517795, "ground_truth": 0}, {"key": "32281151", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7325918310552226, "ground_truth": 0}, {"key": "32281151", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306272020556, "ground_truth": 0}, {"key": "32281151", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891376559772, "ground_truth": 0}, {"key": "37308159", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9184802423505932, "ground_truth": 0}, {"key": "37308159", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9334308072554904, "ground_truth": 0}, {"key": "37308159", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9149009540721025, "ground_truth": 0}, {"key": "37308159", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9559813465160932, "ground_truth": 0}, {"key": "37308159", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772216369688, "ground_truth": 0}, {"key": "35694408", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7386690754958077, "ground_truth": 0}, {"key": "35694408", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8864204119670552, "ground_truth": 0}, {"key": "35694408", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8661325171168293, "ground_truth": 0}, {"key": "35694408", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424467988096, "ground_truth": 0}, {"key": "35694408", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159534266261, "ground_truth": 0}, {"key": "39781995", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7356416547462402, "ground_truth": 0}, {"key": "39781995", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7799928933196634, "ground_truth": 0}, {"key": "39781995", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8092759458686987, "ground_truth": 0}, {"key": "39781995", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445389095714, "ground_truth": 0}, {"key": "39781995", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.727975429394987, "ground_truth": 0}, {"key": "22799372", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9309620709577221, "ground_truth": 0}, {"key": "22799372", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9559813508807784, "ground_truth": 0}, {"key": "22799372", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9465966716155049, "ground_truth": 0}, {"key": "22799372", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9818752779765296, "ground_truth": 0}, {"key": "22799372", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9740426421621431, "ground_truth": 0}, {"key": "37428240", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6297746203002224, "ground_truth": 0}, {"key": "37428240", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.66192287762535, "ground_truth": 0}, {"key": "37428240", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.588889131217802, "ground_truth": 0}, {"key": "37428240", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163502435084, "ground_truth": 0}, {"key": "37428240", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512617764608, "ground_truth": 0}, {"key": "40612657", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.902609601780803, "ground_truth": 0}, {"key": "40612657", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9190632917745046, "ground_truth": 0}, {"key": "40612657", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8918110485377666, "ground_truth": 0}, {"key": "40612657", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9059898203315332, "ground_truth": 0}, {"key": "40612657", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218387841225, "ground_truth": 0}, {"key": "34404662", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.769080250981475, "ground_truth": 0}, {"key": "34404662", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8031738017203196, "ground_truth": 0}, {"key": "34404662", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8925625226297909, "ground_truth": 0}, {"key": "34404662", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9092645202128794, "ground_truth": 0}, {"key": "34404662", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215374583786, "ground_truth": 0}, {"key": "32619704", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7943849542361128, "ground_truth": 0}, {"key": "32619704", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7371581708224478, "ground_truth": 0}, {"key": "32619704", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7813306210517077, "ground_truth": 0}, {"key": "32619704", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619200099028, "ground_truth": 0}, {"key": "32619704", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163737794197, "ground_truth": 0}, {"key": "39014883", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7008948178332627, "ground_truth": 0}, {"key": "39014883", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.695958355788763, "ground_truth": 0}, {"key": "39014883", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.654894732242651, "ground_truth": 0}, {"key": "39014883", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791787234996579, "ground_truth": 0}, {"key": "39014883", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339659246685, "ground_truth": 0}, {"key": "37982812", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9449947182549266, "ground_truth": 0}, {"key": "37982812", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.957596172312374, "ground_truth": 0}, {"key": "37982812", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9343951642545406, "ground_truth": 0}, {"key": "37982812", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9518632312743941, "ground_truth": 0}, {"key": "37982812", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9686195680687902, "ground_truth": 0}, {"key": "28123476", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8705972576338489, "ground_truth": 0}, {"key": "28123476", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7981867730197669, "ground_truth": 0}, {"key": "28123476", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8714748663916665, "ground_truth": 0}, {"key": "28123476", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240769922217, "ground_truth": 0}, {"key": "28123476", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314733095656, "ground_truth": 0}, {"key": "39078849", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5486735079160243, "ground_truth": 0}, {"key": "39078849", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7549150040362342, "ground_truth": 0}, {"key": "39078849", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059166286791, "ground_truth": 0}, {"key": "39078849", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581528745109, "ground_truth": 0}, {"key": "39078849", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754532497682, "ground_truth": 0}, {"key": "39414137", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9744347868902211, "ground_truth": 0}, {"key": "39414137", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9763105280389702, "ground_truth": 0}, {"key": "39414137", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9777138122124833, "ground_truth": 0}, {"key": "39414137", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9746286908355094, "ground_truth": 0}, {"key": "39414137", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9750122054686879, "ground_truth": 0}, {"key": "37371354", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6388352581461773, "ground_truth": 0}, {"key": "37371354", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8210441236794456, "ground_truth": 0}, {"key": "37371354", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6334102730989999, "ground_truth": 0}, {"key": "37371354", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582795570078, "ground_truth": 0}, {"key": "37371354", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615824626631, "ground_truth": 0}, {"key": "29497179", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8221891446163286, "ground_truth": 0}, {"key": "29497179", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7138307636390434, "ground_truth": 0}, {"key": "29497179", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7879311955813741, "ground_truth": 0}, {"key": "29497179", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837654982038, "ground_truth": 0}, {"key": "29497179", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575593095613, "ground_truth": 0}, {"key": "35908694", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.94417686541749, "ground_truth": 0}, {"key": "35908694", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9588471129495367, "ground_truth": 0}, {"key": "35908694", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9621075715387256, "ground_truth": 0}, {"key": "35908694", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9603611639077706, "ground_truth": 0}, {"key": "35908694", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9511422170787015, "ground_truth": 0}, {"key": "37619358", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7943849591211398, "ground_truth": 0}, {"key": "37619358", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8080672232688553, "ground_truth": 0}, {"key": "37619358", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7341195440639002, "ground_truth": 0}, {"key": "37619358", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718435038243711, "ground_truth": 0}, {"key": "37619358", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872223396023, "ground_truth": 0}, {"key": "37293103", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8714748522846687, "ground_truth": 0}, {"key": "37293103", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8198933501557877, "ground_truth": 0}, {"key": "37293103", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8489722100824635, "ground_truth": 0}, {"key": "37293103", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9362850088410756, "ground_truth": 0}, {"key": "37293103", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9543079669488018, "ground_truth": 0}, {"key": "36883729", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8918110463300201, "ground_truth": 0}, {"key": "36883729", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8489721962533051, "ground_truth": 0}, {"key": "36883729", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7813306372944344, "ground_truth": 0}, {"key": "36883729", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430363006321, "ground_truth": 0}, {"key": "36883729", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493152565427, "ground_truth": 0}, {"key": "39209521", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8289388052523297, "ground_truth": 0}, {"key": "39209521", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8278281520063392, "ground_truth": 0}, {"key": "39209521", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.896251379946613, "ground_truth": 0}, {"key": "39209521", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519527990828857, "ground_truth": 0}, {"key": "39209521", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053222862666062, "ground_truth": 0}, {"key": "27792571", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7295197793052479, "ground_truth": 0}, {"key": "27792571", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7401743454695447, "ground_truth": 0}, {"key": "27792571", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7090191428575889, "ground_truth": 0}, {"key": "27792571", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835424332117, "ground_truth": 0}, {"key": "27792571", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998599463118, "ground_truth": 0}, {"key": "39755647", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8344068976847303, "ground_truth": 0}, {"key": "39755647", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8428631473541305, "ground_truth": 0}, {"key": "39755647", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8255897383639861, "ground_truth": 0}, {"key": "39755647", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300550122316, "ground_truth": 0}, {"key": "39755647", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228077953297, "ground_truth": 0}, {"key": "40800537", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.4532618470312244, "ground_truth": 0}, {"key": "40800537", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5794003979516628, "ground_truth": 0}, {"key": "40800537", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5621764927751985, "ground_truth": 0}, {"key": "40800537", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118813416941, "ground_truth": 0}, {"key": "40800537", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370308100185513, "ground_truth": 0}, {"key": "14171461", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5851011472105268, "ground_truth": 0}, {"key": "14171461", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5926665901847715, "ground_truth": 0}, {"key": "14171461", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7233094704956716, "ground_truth": 0}, {"key": "14171461", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531269037493104, "ground_truth": 0}, {"key": "14171461", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.756357560135433, "ground_truth": 0}, {"key": "36892440", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7233094711469397, "ground_truth": 0}, {"key": "36892440", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7745833964319344, "ground_truth": 0}, {"key": "36892440", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7994423140269968, "ground_truth": 0}, {"key": "36892440", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424221579795, "ground_truth": 0}, {"key": "36892440", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489721852568755, "ground_truth": 0}, {"key": "33733410", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8661325075786271, "ground_truth": 0}, {"key": "33733410", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.860603609917729, "ground_truth": 0}, {"key": "33733410", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8519528040321385, "ground_truth": 0}, {"key": "33733410", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.718594382950825, "ground_truth": 0}, {"key": "33733410", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256510722584, "ground_truth": 0}, {"key": "38587765", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6020616027281169, "ground_truth": 0}, {"key": "38587765", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6076631601560899, "ground_truth": 0}, {"key": "38587765", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.4610167700543767, "ground_truth": 0}, {"key": "38587765", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5350984457901594, "ground_truth": 0}, {"key": "38587765", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802484384256, "ground_truth": 0}, {"key": "41065582", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835415799718, "ground_truth": 0}, {"key": "41065582", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6943026873574554, "ground_truth": 0}, {"key": "41065582", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8499711785358697, "ground_truth": 0}, {"key": "41065582", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506674688626, "ground_truth": 0}, {"key": "41065582", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.852935481243264, "ground_truth": 0}, {"key": "34713891", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6315942953461201, "ground_truth": 0}, {"key": "34713891", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6943026832137305, "ground_truth": 0}, {"key": "34713891", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6926419757303782, "ground_truth": 0}, {"key": "34713891", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690719473793, "ground_truth": 0}, {"key": "34713891", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717665944801898, "ground_truth": 0}, {"key": "18913023", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8991213828561346, "ground_truth": 0}, {"key": "18913023", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9399133517398678, "ground_truth": 0}, {"key": "18913023", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8832359827910383, "ground_truth": 0}, {"key": "18913023", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666542446574, "ground_truth": 0}, {"key": "18913023", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9381240127279651, "ground_truth": 0}, {"key": "36884100", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.4785288367678965, "ground_truth": 0}, {"key": "36884100", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.48047869306552077, "ground_truth": 0}, {"key": "36884100", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.31742625558321735, "ground_truth": 0}, {"key": "36884100", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711434379016, "ground_truth": 0}, {"key": "36884100", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707365923557978, "ground_truth": 0}, {"key": "39899913", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8479677770663401, "ground_truth": 0}, {"key": "39899913", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8407825864824989, "ground_truth": 0}, {"key": "39899913", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8783142464582965, "ground_truth": 0}, {"key": "39899913", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619253968357, "ground_truth": 0}, {"key": "39899913", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772584847375, "ground_truth": 0}, {"key": "30725366", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.4921881606397976, "ground_truth": 0}, {"key": "30725366", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6279512124070282, "ground_truth": 0}, {"key": "30725366", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5409238845700536, "ground_truth": 0}, {"key": "30725366", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358384960325, "ground_truth": 0}, {"key": "30725366", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056128628912, "ground_truth": 0}, {"key": "26133523", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8031738046625231, "ground_truth": 0}, {"key": "26133523", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5448014057292164, "ground_truth": 0}, {"key": "26133523", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7648916172501223, "ground_truth": 0}, {"key": "26133523", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056209919525, "ground_truth": 0}, {"key": "26133523", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210812149707, "ground_truth": 0}, {"key": "29332665", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835353916186, "ground_truth": 0}, {"key": "29332665", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8606036185480241, "ground_truth": 0}, {"key": "29332665", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7264256088231515, "ground_truth": 0}, {"key": "29332665", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802272239389, "ground_truth": 0}, {"key": "29332665", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786322098381, "ground_truth": 0}, {"key": "37400481", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8918110373371296, "ground_truth": 0}, {"key": "37400481", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9412234442470522, "ground_truth": 0}, {"key": "37400481", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9358173563986913, "ground_truth": 0}, {"key": "37400481", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9213576209605967, "ground_truth": 0}, {"key": "37400481", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099446608082, "ground_truth": 0}, {"key": "38787241", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6370307912299303, "ground_truth": 0}, {"key": "38787241", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7969253697182774, "ground_truth": 0}, {"key": "38787241", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7371581648579392, "ground_truth": 0}, {"key": "38787241", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122783072486, "ground_truth": 0}, {"key": "38787241", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089302457774, "ground_truth": 0}, {"key": "38225963", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6020616161473653, "ground_truth": 0}, {"key": "38225963", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7490872046548726, "ground_truth": 0}, {"key": "38225963", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6460136990289288, "ground_truth": 0}, {"key": "38225963", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849681968925, "ground_truth": 0}, {"key": "38225963", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059552349723, "ground_truth": 0}, {"key": "26072034", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5175708621211765, "ground_truth": 0}, {"key": "26072034", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4016878092616831, "ground_truth": 0}, {"key": "26072034", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5832033737273601, "ground_truth": 0}, {"key": "26072034", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487214138514, "ground_truth": 0}, {"key": "26072034", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5813030940471242, "ground_truth": 0}, {"key": "35690810", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7505527684623639, "ground_truth": 0}, {"key": "35690810", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8749346190232493, "ground_truth": 0}, {"key": "35690810", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7745833939134957, "ground_truth": 0}, {"key": "35690810", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128672981402995, "ground_truth": 0}, {"key": "35690810", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241609444156, "ground_truth": 0}, {"key": "36855665", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9681411443187261, "ground_truth": 0}, {"key": "36855665", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9603611598040915, "ground_truth": 0}, {"key": "36855665", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9626731160290783, "ground_truth": 0}, {"key": "36855665", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067271780571, "ground_truth": 0}, {"key": "36855665", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.953966095053945, "ground_truth": 0}, {"key": "29757662", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6688802731981831, "ground_truth": 0}, {"key": "29757662", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6909762914966739, "ground_truth": 0}, {"key": "29757662", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6242935506840074, "ground_truth": 0}, {"key": "29757662", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891297787565, "ground_truth": 0}, {"key": "29757662", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762992930424, "ground_truth": 0}, {"key": "19134339", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7956580806024754, "ground_truth": 0}, {"key": "19134339", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.684264038600912, "ground_truth": 0}, {"key": "19134339", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.627951226433028, "ground_truth": 0}, {"key": "19134339", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307645724119, "ground_truth": 0}, {"key": "19134339", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074047092245409, "ground_truth": 0}, {"key": "35360732", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9124361548264112, "ground_truth": 0}, {"key": "35360732", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9099069969773624, "ground_truth": 0}, {"key": "35360732", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9358173569723274, "ground_truth": 0}, {"key": "35360732", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9053222901643693, "ground_truth": 0}, {"key": "35360732", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424411150379, "ground_truth": 0}, {"key": "37713629", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.552539684841501, "ground_truth": 0}, {"key": "37713629", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7476159688175522, "ground_truth": 0}, {"key": "37713629", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6224593303726258, "ground_truth": 0}, {"key": "37713629", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632158087281236, "ground_truth": 0}, {"key": "37713629", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5312093747493014, "ground_truth": 0}, {"key": "33393394", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8056321681592169, "ground_truth": 0}, {"key": "33393394", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7217432023145832, "ground_truth": 0}, {"key": "33393394", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7981867864209946, "ground_truth": 0}, {"key": "33393394", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548547244117, "ground_truth": 0}, {"key": "33393394", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837547192668, "ground_truth": 0}, {"key": "32275837", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9437636590999844, "ground_truth": 0}, {"key": "32275837", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9230391626847757, "ground_truth": 0}, {"key": "32275837", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9458012712253373, "ground_truth": 0}, {"key": "32275837", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797117401877, "ground_truth": 0}, {"key": "32275837", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9202179906162472, "ground_truth": 0}, {"key": "21458094", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5660185191733283, "ground_truth": 0}, {"key": "21458094", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6076631810642623, "ground_truth": 0}, {"key": "21458094", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7662936554284075, "ground_truth": 0}, {"key": "21458094", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527539689107, "ground_truth": 0}, {"key": "21458094", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494842443112, "ground_truth": 0}, {"key": "40975362", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9339146239829336, "ground_truth": 0}, {"key": "40975362", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9582261207768816, "ground_truth": 0}, {"key": "40975362", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9429286003845935, "ground_truth": 0}, {"key": "40975362", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9485372358906298, "ground_truth": 0}, {"key": "40975362", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218355900906, "ground_truth": 0}, {"key": "35234201", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9136765171440774, "ground_truth": 0}, {"key": "35234201", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8056321908482552, "ground_truth": 0}, {"key": "35234201", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7905303247255044, "ground_truth": 0}, {"key": "35234201", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802277640462, "ground_truth": 0}, {"key": "35234201", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632864752724, "ground_truth": 0}, {"key": "36037573", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7295197775254203, "ground_truth": 0}, {"key": "36037573", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7592254198076542, "ground_truth": 0}, {"key": "36037573", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8198933420241619, "ground_truth": 0}, {"key": "36037573", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690678385627, "ground_truth": 0}, {"key": "36037573", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441110427921, "ground_truth": 0}, {"key": "30861915", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9059898157842319, "ground_truth": 0}, {"key": "30861915", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8947894667477869, "ground_truth": 0}, {"key": "30861915", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.894051715651663, "ground_truth": 0}, {"key": "30861915", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094088108884, "ground_truth": 0}, {"key": "30861915", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.909907008136344, "ground_truth": 0}, {"key": "40173012", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7931059759220466, "ground_truth": 0}, {"key": "40173012", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7279754463913138, "ground_truth": 0}, {"key": "40173012", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8092759747401943, "ground_truth": 0}, {"key": "40173012", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031738000896492, "ground_truth": 0}, {"key": "40173012", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382198048439, "ground_truth": 0}, {"key": "35100330", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5370413989725876, "ground_truth": 0}, {"key": "35100330", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5428632576865464, "ground_truth": 0}, {"key": "35100330", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5350984197545137, "ground_truth": 0}, {"key": "35100330", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688073108262, "ground_truth": 0}, {"key": "35100330", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185467850695, "ground_truth": 0}, {"key": "37220221", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9606574973980408, "ground_truth": 0}, {"key": "37220221", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9425067210207708, "ground_truth": 0}, {"key": "37220221", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.945801277412078, "ground_truth": 0}, {"key": "37220221", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9437636541189154, "ground_truth": 0}, {"key": "37220221", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372108034190054, "ground_truth": 0}, {"key": "38815218", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9504109780170155, "ground_truth": 0}, {"key": "38815218", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9477691412399468, "ground_truth": 0}, {"key": "38815218", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9309620707561552, "ground_truth": 0}, {"key": "38815218", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037271668432, "ground_truth": 0}, {"key": "38815218", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9661559636513642, "ground_truth": 0}, {"key": "39379109", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7106282871558438, "ground_truth": 0}, {"key": "39379109", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5621765165063947, "ground_truth": 0}, {"key": "39379109", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5389832342882623, "ground_truth": 0}, {"key": "39379109", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.65312691655412, "ground_truth": 0}, {"key": "39379109", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926666023064139, "ground_truth": 0}, {"key": "14576125", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.3398276337538243, "ground_truth": 0}, {"key": "14576125", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4301473423854837, "ground_truth": 0}, {"key": "14576125", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.20817892281508596, "ground_truth": 0}, {"key": "14576125", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.26133094650731825, "ground_truth": 0}, {"key": "14576125", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.2598256222053615, "ground_truth": 0}, {"key": "40814250", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7704647873634666, "ground_truth": 0}, {"key": "40814250", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8670357664913616, "ground_truth": 0}, {"key": "40814250", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7943849589240499, "ground_truth": 0}, {"key": "40814250", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892337026943833, "ground_truth": 0}, {"key": "40814250", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916144677924, "ground_truth": 0}, {"key": "36334488", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6242935447923278, "ground_truth": 0}, {"key": "36334488", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.646013701932587, "ground_truth": 0}, {"key": "36334488", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6859494552488955, "ground_truth": 0}, {"key": "36334488", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008947827071857, "ground_truth": 0}, {"key": "36334488", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548548531681, "ground_truth": 0}, {"key": "36888322", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.782662478553922, "ground_truth": 0}, {"key": "36888322", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7563575524412455, "ground_truth": 0}, {"key": "36888322", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8175744656746439, "ground_truth": 0}, {"key": "36888322", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210678649, "ground_truth": 0}, {"key": "36888322", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677514007935, "ground_truth": 0}, {"key": "37318916", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9252299489405565, "ground_truth": 0}, {"key": "37318916", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9299510468624358, "ground_truth": 0}, {"key": "37318916", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9224823341431887, "ground_truth": 0}, {"key": "37318916", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9319595786465004, "ground_truth": 0}, {"key": "37318916", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9481545280185836, "ground_truth": 0}, {"key": "39308700", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7154239792843968, "ground_truth": 0}, {"key": "39308700", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7956580929294323, "ground_truth": 0}, {"key": "39308700", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7662936511256839, "ground_truth": 0}, {"key": "39308700", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.756357568544462, "ground_truth": 0}, {"key": "39308700", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228206501844, "ground_truth": 0}, {"key": "31061543", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8643104562786293, "ground_truth": 0}, {"key": "31061543", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.832236646070679, "ground_truth": 0}, {"key": "31061543", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8633916023253307, "ground_truth": 0}, {"key": "31061543", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9059898166567806, "ground_truth": 0}, {"key": "31061543", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711643339183, "ground_truth": 0}, {"key": "37380894", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7918210602455141, "ground_truth": 0}, {"key": "37380894", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8509647117125806, "ground_truth": 0}, {"key": "37380894", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7905303179198816, "ground_truth": 0}, {"key": "37380894", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754612227577, "ground_truth": 0}, {"key": "37380894", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063869236234, "ground_truth": 0}, {"key": "38410139", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7461389988773361, "ground_truth": 0}, {"key": "38410139", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7106283015383522, "ground_truth": 0}, {"key": "38410139", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8255897090023218, "ground_truth": 0}, {"key": "38410139", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919882840321, "ground_truth": 0}, {"key": "38410139", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489722053388407, "ground_truth": 0}, {"key": "35953842", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6791787208863412, "ground_truth": 0}, {"key": "35953842", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7549150010656519, "ground_truth": 0}, {"key": "35953842", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6706082717921569, "ground_truth": 0}, {"key": "35953842", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646096989843, "ground_truth": 0}, {"key": "35953842", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926665869311368, "ground_truth": 0}, {"key": "39815663", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6601723816679483, "ground_truth": 0}, {"key": "39815663", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6723316845693238, "ground_truth": 0}, {"key": "39815663", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7106283138897042, "ground_truth": 0}, {"key": "39815663", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.401687795422393, "ground_truth": 0}, {"key": "39815663", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5813030880174371, "ground_truth": 0}, {"key": "35121432", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8774767891601581, "ground_truth": 0}, {"key": "35121432", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9294404028616511, "ground_truth": 0}, {"key": "35121432", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8895288352009373, "ground_truth": 0}, {"key": "35121432", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952950302313, "ground_truth": 0}, {"key": "35121432", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314737877414, "ground_truth": 0}, {"key": "21712310", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5888891380637372, "ground_truth": 0}, {"key": "21712310", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.548673509345623, "ground_truth": 0}, {"key": "21712310", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.537041384040279, "ground_truth": 0}, {"key": "21712310", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185434828872, "ground_truth": 0}, {"key": "21712310", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.472683474445105, "ground_truth": 0}, {"key": "37952914", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7248702926149395, "ground_truth": 0}, {"key": "37952914", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7341195131428433, "ground_truth": 0}, {"key": "37952914", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8652240817870878, "ground_truth": 0}, {"key": "37952914", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336931542924, "ground_truth": 0}, {"key": "37952914", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760175629012, "ground_truth": 0}, {"key": "38956779", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8164063729550147, "ground_truth": 0}, {"key": "38956779", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8587185782095879, "ground_truth": 0}, {"key": "38956779", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358440052717, "ground_truth": 0}, {"key": "38956779", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936450351006, "ground_truth": 0}, {"key": "38956779", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527943163927, "ground_truth": 0}, {"key": "36101833", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.785308588205553, "ground_truth": 0}, {"key": "36101833", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624720949004, "ground_truth": 0}, {"key": "36101833", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8732148270715021, "ground_truth": 0}, {"key": "36101833", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.743168002412561, "ground_truth": 0}, {"key": "36101833", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893055941415275, "ground_truth": 0}, {"key": "35544662", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6992544449040193, "ground_truth": 0}, {"key": "35544662", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6842640254353102, "ground_truth": 0}, {"key": "35544662", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7248702592189621, "ground_truth": 0}, {"key": "35544662", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647903189712, "ground_truth": 0}, {"key": "35544662", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.690976288680251, "ground_truth": 0}, {"key": "39759044", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8499711783002115, "ground_truth": 0}, {"key": "39759044", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8019358228022324, "ground_truth": 0}, {"key": "39759044", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8221891303327945, "ground_truth": 0}, {"key": "39759044", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916010238686, "ground_truth": 0}, {"key": "39759044", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339725907744, "ground_truth": 0}, {"key": "39433018", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9105453915627918, "ground_truth": 0}, {"key": "39433018", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9167080737008453, "ground_truth": 0}, {"key": "39433018", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9105453976580432, "ground_truth": 0}, {"key": "39433018", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233284095521547, "ground_truth": 0}, {"key": "39433018", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343667009545, "ground_truth": 0}, {"key": "22111959", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7772998548095595, "ground_truth": 0}, {"key": "22111959", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7170118930548821, "ground_truth": 0}, {"key": "22111959", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7718434869871247, "ground_truth": 0}, {"key": "22111959", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102765038785, "ground_truth": 0}, {"key": "22111959", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215349724802, "ground_truth": 0}, {"key": "38210094", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6654105575458937, "ground_truth": 0}, {"key": "38210094", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.42823338175426107, "ground_truth": 0}, {"key": "38210094", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6370308083525835, "ground_truth": 0}, {"key": "38210094", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201715027950153, "ground_truth": 0}, {"key": "38210094", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688347995014, "ground_truth": 0}, {"key": "37675935", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.598312188894989, "ground_truth": 0}, {"key": "37675935", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5736783895857065, "ground_truth": 0}, {"key": "37675935", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6548947349670057, "ground_truth": 0}, {"key": "37675935", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690877292197, "ground_truth": 0}, {"key": "37675935", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585784155234, "ground_truth": 0}, {"key": "35732604", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5621765082930978, "ground_truth": 0}, {"key": "35732604", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5156199023697176, "ground_truth": 0}, {"key": "35732604", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5563995677793874, "ground_truth": 0}, {"key": "35732604", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504667166582, "ground_truth": 0}, {"key": "35732604", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5312093873840541, "ground_truth": 0}, {"key": "27453212", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7634837570433515, "ground_truth": 0}, {"key": "27453212", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8587185919305275, "ground_truth": 0}, {"key": "27453212", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.851952809827531, "ground_truth": 0}, {"key": "27453212", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036120120356, "ground_truth": 0}, {"key": "27453212", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677590646629, "ground_truth": 0}, {"key": "39910047", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7786493035365006, "ground_truth": 0}, {"key": "39910047", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624934602774, "ground_truth": 0}, {"key": "39910047", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6187804493756626, "ground_truth": 0}, {"key": "39910047", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819617321006, "ground_truth": 0}, {"key": "39910047", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435127128568, "ground_truth": 0}, {"key": "40054265", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6566582957712477, "ground_truth": 0}, {"key": "40054265", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4804786987270427, "ground_truth": 0}, {"key": "40054265", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6297746163738343, "ground_truth": 0}, {"key": "40054265", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4863315390178622, "ground_truth": 0}, {"key": "40054265", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583270055868297, "ground_truth": 0}, {"key": "19984615", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8679338461980027, "ground_truth": 0}, {"key": "19984615", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9289263327210541, "ground_truth": 0}, {"key": "19984615", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8418256455539839, "ground_truth": 0}, {"key": "19984615", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.837619981070748, "ground_truth": 0}, {"key": "19984615", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891202691372, "ground_truth": 0}, {"key": "16490806", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.40544873877404963, "ground_truth": 0}, {"key": "16490806", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5832033633280185, "ground_truth": 0}, {"key": "16490806", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5448013863036208, "ground_truth": 0}, {"key": "16490806", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366145107821, "ground_truth": 0}, {"key": "16490806", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880011919612, "ground_truth": 0}, {"key": "36396237", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9481545335381454, "ground_truth": 0}, {"key": "36396237", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8714748628144547, "ground_truth": 0}, {"key": "36396237", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9441768555354805, "ground_truth": 0}, {"key": "36396237", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277789687622, "ground_truth": 0}, {"key": "36396237", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9173026624573701, "ground_truth": 0}, {"key": "40726444", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7853085827187589, "ground_truth": 0}, {"key": "40726444", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9086178936109566, "ground_truth": 0}, {"key": "40726444", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8233284032466808, "ground_truth": 0}, {"key": "40726444", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743685245039, "ground_truth": 0}, {"key": "40726444", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256412672627, "ground_truth": 0}, {"key": "37314826", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7446563213168177, "ground_truth": 0}, {"key": "37314826", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5755879897768422, "ground_truth": 0}, {"key": "37314826", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6723316982501636, "ground_truth": 0}, {"key": "37314826", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689549654343, "ground_truth": 0}, {"key": "37314826", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512266124663, "ground_truth": 0}, {"key": "38506971", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6442251063266412, "ground_truth": 0}, {"key": "38506971", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5602526647058763, "ground_truth": 0}, {"key": "38506971", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7170118727385856, "ground_truth": 0}, {"key": "38506971", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668456140898995, "ground_truth": 0}, {"key": "38506971", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.46879062577626024, "ground_truth": 0}, {"key": "40699312", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8386797632196825, "ground_truth": 0}, {"key": "40699312", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8499711611180741, "ground_truth": 0}, {"key": "40699312", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8723473728855169, "ground_truth": 0}, {"key": "40699312", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897156369775, "ground_truth": 0}, {"key": "40699312", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759850312033, "ground_truth": 0}, {"key": "34695474", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7759445660772373, "ground_truth": 0}, {"key": "34695474", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7416740239825897, "ground_truth": 0}, {"key": "34695474", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7648916067725926, "ground_truth": 0}, {"key": "34695474", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082808193696, "ground_truth": 0}, {"key": "34695474", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365543988637, "ground_truth": 0}, {"key": "36281498", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8969755718186608, "ground_truth": 0}, {"key": "36281498", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9118099498463544, "ground_truth": 0}, {"key": "36281498", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9032941983867193, "ground_truth": 0}, {"key": "36281498", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9600626874884505, "ground_truth": 0}, {"key": "36281498", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.895522674873219, "ground_truth": 0}, {"key": "39558652", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6740504881310216, "ground_truth": 0}, {"key": "39558652", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7341195123843176, "ground_truth": 0}, {"key": "39558652", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7325918352799067, "ground_truth": 0}, {"key": "39558652", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740105595771, "ground_truth": 0}, {"key": "39558652", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125900145298, "ground_truth": 0}, {"key": "37330579", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8092759753390435, "ground_truth": 0}, {"key": "37330579", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7956581010455787, "ground_truth": 0}, {"key": "37330579", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7386690626259016, "ground_truth": 0}, {"key": "37330579", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416739942529218, "ground_truth": 0}, {"key": "37330579", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898470965297, "ground_truth": 0}, {"key": "40547658", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8438951049789788, "ground_truth": 0}, {"key": "40547658", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7879312003178748, "ground_truth": 0}, {"key": "40547658", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.866132524202502, "ground_truth": 0}, {"key": "40547658", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743777090346, "ground_truth": 0}, {"key": "40547658", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637528150162, "ground_truth": 0}, {"key": "37119340", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.629774606718381, "ground_truth": 0}, {"key": "37119340", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6531269167891927, "ground_truth": 0}, {"key": "37119340", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6297746217480513, "ground_truth": 0}, {"key": "37119340", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365703341267, "ground_truth": 0}, {"key": "37119340", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850263803953, "ground_truth": 0}, {"key": "35301627", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6477982158842472, "ground_truth": 0}, {"key": "35301627", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.637030774194612, "ground_truth": 0}, {"key": "35301627", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898648926652, "ground_truth": 0}, {"key": "35301627", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578358017085, "ground_truth": 0}, {"key": "35301627", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.872347386865714, "ground_truth": 0}, {"key": "34037168", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7606506576090534, "ground_truth": 0}, {"key": "34037168", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7732163672093406, "ground_truth": 0}, {"key": "34037168", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7431680072463136, "ground_truth": 0}, {"key": "34037168", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.783988468366615, "ground_truth": 0}, {"key": "34037168", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799929116698344, "ground_truth": 0}, {"key": "39703862", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9539660972318563, "ground_truth": 0}, {"key": "39703862", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9640516774544119, "ground_truth": 0}, {"key": "39703862", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9546474198119281, "ground_truth": 0}, {"key": "39703862", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.960361159584907, "ground_truth": 0}, {"key": "39703862", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9632305349793358, "ground_truth": 0}, {"key": "16554814", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9284087979099447, "ground_truth": 0}, {"key": "16554814", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9136765200326434, "ground_truth": 0}, {"key": "16554814", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8848377694326576, "ground_truth": 0}, {"key": "16554814", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.907967141936318, "ground_truth": 0}, {"key": "16554814", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9039745116710634, "ground_truth": 0}, {"key": "32983099", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.586996416182434, "ground_truth": 0}, {"key": "32983099", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.642432473819846, "ground_truth": 0}, {"key": "32983099", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5175709048399708, "ground_truth": 0}, {"key": "32983099", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633753094756, "ground_truth": 0}, {"key": "32983099", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203265475886, "ground_truth": 0}, {"key": "41072994", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5640984823417746, "ground_truth": 0}, {"key": "41072994", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6206215967748671, "ground_truth": 0}, {"key": "41072994", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.566018536088929, "ground_truth": 0}, {"key": "41072994", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419575383318, "ground_truth": 0}, {"key": "41072994", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984779767281, "ground_truth": 0}, {"key": "38396247", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.831143064205587, "ground_truth": 0}, {"key": "38396247", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7170118805433435, "ground_truth": 0}, {"key": "38396247", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8365545638084614, "ground_truth": 0}, {"key": "38396247", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122995355646, "ground_truth": 0}, {"key": "38396247", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.777299869312679, "ground_truth": 0}, {"key": "37507998", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8438951108178966, "ground_truth": 0}, {"key": "37507998", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8311430501706808, "ground_truth": 0}, {"key": "37507998", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9039745128615881, "ground_truth": 0}, {"key": "37507998", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545559876996, "ground_truth": 0}, {"key": "37507998", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145793298617, "ground_truth": 0}, {"key": "32593929", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.598312179054081, "ground_truth": 0}, {"key": "32593929", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5602526496170633, "ground_truth": 0}, {"key": "32593929", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6352224385210666, "ground_truth": 0}, {"key": "32593929", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704661305279, "ground_truth": 0}, {"key": "32593929", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794003808561178, "ground_truth": 0}, {"key": "36056449", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5389831999636319, "ground_truth": 0}, {"key": "36056449", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7074047094740824, "ground_truth": 0}, {"key": "36056449", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7154239878184556, "ground_truth": 0}, {"key": "36056449", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615984979667, "ground_truth": 0}, {"key": "36056449", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723316711066694, "ground_truth": 0}, {"key": "21986185", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7279754355065731, "ground_truth": 0}, {"key": "21986185", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7879311922919652, "ground_truth": 0}, {"key": "21986185", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6723316970368808, "ground_truth": 0}, {"key": "21986185", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760138133545, "ground_truth": 0}, {"key": "21986185", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.660172373370491, "ground_truth": 0}, {"key": "40757465", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6859494665992246, "ground_truth": 0}, {"key": "40757465", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6495786364395957, "ground_truth": 0}, {"key": "40757465", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6531269255142905, "ground_truth": 0}, {"key": "40757465", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.766293644749408, "ground_truth": 0}, {"key": "40757465", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872013571421, "ground_truth": 0}, {"key": "35198313", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6943026629659088, "ground_truth": 0}, {"key": "35198313", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6566582596311897, "ground_truth": 0}, {"key": "35198313", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6566582555160229, "ground_truth": 0}, {"key": "35198313", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883612339123, "ground_truth": 0}, {"key": "35198313", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.61508785941772, "ground_truth": 0}, {"key": "30604618", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7386690693683386, "ground_truth": 0}, {"key": "30604618", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.620621610970304, "ground_truth": 0}, {"key": "30604618", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7704647796617008, "ground_truth": 0}, {"key": "30604618", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689884361668, "ground_truth": 0}, {"key": "30604618", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013613533009, "ground_truth": 0}, {"key": "35779006", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7704648004276888, "ground_truth": 0}, {"key": "35779006", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6206216347582992, "ground_truth": 0}, {"key": "35779006", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6584175169744744, "ground_truth": 0}, {"key": "35779006", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898574464205, "ground_truth": 0}, {"key": "35779006", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884691144812, "ground_truth": 0}, {"key": "33858956", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6791787158145113, "ground_truth": 0}, {"key": "33858956", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.743168005223982, "ground_truth": 0}, {"key": "33858956", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.83548352949552, "ground_truth": 0}, {"key": "33858956", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545486086026, "ground_truth": 0}, {"key": "33858956", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253655866337, "ground_truth": 0}, {"key": "38633880", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7371581746157924, "ground_truth": 0}, {"key": "38633880", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6601723923507282, "ground_truth": 0}, {"key": "38633880", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7520125865549161, "ground_truth": 0}, {"key": "38633880", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935643785837, "ground_truth": 0}, {"key": "38633880", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442250948099659, "ground_truth": 0}, {"key": "36654905", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9820137891113527, "ground_truth": 0}, {"key": "36654905", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9908034470025768, "ground_truth": 0}, {"key": "36654905", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9805806503895818, "ground_truth": 0}, {"key": "36654905", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9553191306227872, "ground_truth": 0}, {"key": "36654905", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9575961682060348, "ground_truth": 0}, {"key": "26547482", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6095241912356325, "ground_truth": 0}, {"key": "26547482", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5312093394007417, "ground_truth": 0}, {"key": "26547482", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.43974733397652815, "ground_truth": 0}, {"key": "26547482", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318310902333, "ground_truth": 0}, {"key": "26547482", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365586776701, "ground_truth": 0}, {"key": "36439068", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8365545673458287, "ground_truth": 0}, {"key": "36439068", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5506073747850596, "ground_truth": 0}, {"key": "36439068", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7008948024102223, "ground_truth": 0}, {"key": "36439068", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448013835308733, "ground_truth": 0}, {"key": "36439068", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666115451472, "ground_truth": 0}, {"key": "30501258", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9656413094073255, "ground_truth": 0}, {"key": "30501258", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9202179920433617, "ground_truth": 0}, {"key": "30501258", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.954307967213939, "ground_truth": 0}, {"key": "30501258", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.927363292445023, "ground_truth": 0}, {"key": "30501258", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9273632902303662, "ground_truth": 0}, {"key": "37560941", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7386690730163723, "ground_truth": 0}, {"key": "37560941", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7248702758165247, "ground_truth": 0}, {"key": "37560941", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358178554826, "ground_truth": 0}, {"key": "37560941", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358224702096, "ground_truth": 0}, {"key": "37560941", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631423610273, "ground_truth": 0}, {"key": "36801665", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9046505300300429, "ground_truth": 0}, {"key": "36801665", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9481545342632591, "ground_truth": 0}, {"key": "36801665", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8587185855281958, "ground_truth": 0}, {"key": "36801665", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952947534604, "ground_truth": 0}, {"key": "36801665", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9246876988135826, "ground_truth": 0}, {"key": "34954610", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7138307466875738, "ground_truth": 0}, {"key": "34954610", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.620621605099392, "ground_truth": 0}, {"key": "34954610", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.607663177401037, "ground_truth": 0}, {"key": "34954610", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.680878624962504, "ground_truth": 0}, {"key": "34954610", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324824985574, "ground_truth": 0}, {"key": "37020510", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8499711768691378, "ground_truth": 0}, {"key": "37020510", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8198933457731545, "ground_truth": 0}, {"key": "37020510", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7732163590256252, "ground_truth": 0}, {"key": "37020510", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.808067199690502, "ground_truth": 0}, {"key": "37020510", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256472580274, "ground_truth": 0}, {"key": "38064637", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6169358241012988, "ground_truth": 0}, {"key": "38064637", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7310585843232617, "ground_truth": 0}, {"key": "38064637", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5660185496984899, "ground_truth": 0}, {"key": "38064637", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983121946265941, "ground_truth": 0}, {"key": "38064637", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.682573747248668, "ground_truth": 0}, {"key": "40886108", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8643104457533083, "ground_truth": 0}, {"key": "40886108", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8539127652426545, "ground_truth": 0}, {"key": "40886108", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8615382239485668, "ground_truth": 0}, {"key": "40886108", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887588036583414, "ground_truth": 0}, {"key": "40886108", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104540841942, "ground_truth": 0}, {"key": "38554603", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6757646021731947, "ground_truth": 0}, {"key": "38554603", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8031738132576375, "ground_truth": 0}, {"key": "38554603", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5832033499480618, "ground_truth": 0}, {"key": "38554603", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892337043352179, "ground_truth": 0}, {"key": "38554603", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918460622743, "ground_truth": 0}, {"key": "39115586", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6315942828836985, "ground_truth": 0}, {"key": "39115586", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6740505015798223, "ground_truth": 0}, {"key": "39115586", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6187804163123616, "ground_truth": 0}, {"key": "39115586", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512876907811, "ground_truth": 0}, {"key": "39115586", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283211753703, "ground_truth": 0}, {"key": "38786314", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8128673289499372, "ground_truth": 0}, {"key": "38786314", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8848377768100341, "ground_truth": 0}, {"key": "38786314", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8832359831184331, "ground_truth": 0}, {"key": "38786314", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333245750187945, "ground_truth": 0}, {"key": "38786314", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631484777714, "ground_truth": 0}, {"key": "38721078", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9196425330085816, "ground_truth": 0}, {"key": "38721078", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.89982778986037, "ground_truth": 0}, {"key": "38721078", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9155072493540786, "ground_truth": 0}, {"key": "38721078", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9230391628728584, "ground_truth": 0}, {"key": "38721078", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743675225964, "ground_truth": 0}, {"key": "39475467", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.732591845268845, "ground_truth": 0}, {"key": "39475467", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6132365639174326, "ground_truth": 0}, {"key": "39475467", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7592254029842557, "ground_truth": 0}, {"key": "39475467", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526407657284, "ground_truth": 0}, {"key": "39475467", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014071261128, "ground_truth": 0}, {"key": "35691234", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8799743600613691, "ground_truth": 0}, {"key": "35691234", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.67233170003677, "ground_truth": 0}, {"key": "35691234", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7431680033049913, "ground_truth": 0}, {"key": "35691234", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786265465553, "ground_truth": 0}, {"key": "35691234", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935426111931, "ground_truth": 0}, {"key": "36871390", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7248702897931208, "ground_truth": 0}, {"key": "36871390", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7341195454670748, "ground_truth": 0}, {"key": "36871390", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7606506676549271, "ground_truth": 0}, {"key": "36871390", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059523448151, "ground_truth": 0}, {"key": "36871390", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872242272938, "ground_truth": 0}, {"key": "31730844", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7401743445152114, "ground_truth": 0}, {"key": "31730844", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7401743506436391, "ground_truth": 0}, {"key": "31730844", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8128673134114248, "ground_truth": 0}, {"key": "31730844", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897189485665, "ground_truth": 0}, {"key": "31730844", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640230208098, "ground_truth": 0}, {"key": "30810940", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5660185598121804, "ground_truth": 0}, {"key": "30810940", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.505859095610133, "ground_truth": 0}, {"key": "30810940", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6654105651845839, "ground_truth": 0}, {"key": "30810940", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493249605351, "ground_truth": 0}, {"key": "30810940", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544222198186, "ground_truth": 0}, {"key": "39352003", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9273632947398273, "ground_truth": 0}, {"key": "39352003", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9032942043421641, "ground_truth": 0}, {"key": "39352003", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8714748574597736, "ground_truth": 0}, {"key": "39352003", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9149009582291368, "ground_truth": 0}, {"key": "39352003", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9367494806073354, "ground_truth": 0}, {"key": "40118123", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6859494386386044, "ground_truth": 0}, {"key": "40118123", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6513548706962423, "ground_truth": 0}, {"key": "40118123", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6688802716050433, "ground_truth": 0}, {"key": "40118123", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.535098457178145, "ground_truth": 0}, {"key": "40118123", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241635687733, "ground_truth": 0}, {"key": "37114191", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7416740164641065, "ground_truth": 0}, {"key": "37114191", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5755880415616431, "ground_truth": 0}, {"key": "37114191", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6636689422169728, "ground_truth": 0}, {"key": "37114191", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746274865306, "ground_truth": 0}, {"key": "37114191", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476716582094, "ground_truth": 0}, {"key": "39268203", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.849971174471962, "ground_truth": 0}, {"key": "39268203", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8824278714963419, "ground_truth": 0}, {"key": "39268203", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8679338449492127, "ground_truth": 0}, {"key": "39268203", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358436782605, "ground_truth": 0}, {"key": "39268203", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646959041612, "ground_truth": 0}, {"key": "37950968", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8940517045388283, "ground_truth": 0}, {"key": "37950968", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.709019127967634, "ground_truth": 0}, {"key": "37950968", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7401743575320517, "ground_truth": 0}, {"key": "37950968", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117862152341, "ground_truth": 0}, {"key": "37950968", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195192463109, "ground_truth": 0}, {"key": "34959807", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8152324876452847, "ground_truth": 0}, {"key": "34959807", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7386690560107536, "ground_truth": 0}, {"key": "34959807", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8006920046676232, "ground_truth": 0}, {"key": "34959807", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419721743434, "ground_truth": 0}, {"key": "34959807", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059543522707, "ground_truth": 0}, {"key": "35631314", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8558511345477674, "ground_truth": 0}, {"key": "35631314", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.744656339760193, "ground_truth": 0}, {"key": "35631314", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9012274112051166, "ground_truth": 0}, {"key": "35631314", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755701559368, "ground_truth": 0}, {"key": "35631314", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631535576467, "ground_truth": 0}, {"key": "38082365", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8587185844848205, "ground_truth": 0}, {"key": "38082365", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8732148200088783, "ground_truth": 0}, {"key": "38082365", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.724870282023962, "ground_truth": 0}, {"key": "38082365", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675358478516, "ground_truth": 0}, {"key": "38082365", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388037933645, "ground_truth": 0}, {"key": "37242829", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6636689560718473, "ground_truth": 0}, {"key": "37242829", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6095241701711216, "ground_truth": 0}, {"key": "37242829", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5078118677009082, "ground_truth": 0}, {"key": "37242829", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953721641052, "ground_truth": 0}, {"key": "37242829", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852886581121373, "ground_truth": 0}, {"key": "38556068", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5039061521349486, "ground_truth": 0}, {"key": "38556068", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5428632850850948, "ground_truth": 0}, {"key": "38556068", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.544801390742179, "ground_truth": 0}, {"key": "38556068", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434959454512, "ground_truth": 0}, {"key": "38556068", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680355830796, "ground_truth": 0}, {"key": "32969336", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8164063736450692, "ground_truth": 0}, {"key": "32969336", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8365545671814749, "ground_truth": 0}, {"key": "32969336", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7620701178692668, "ground_truth": 0}, {"key": "32969336", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303264734245, "ground_truth": 0}, {"key": "32969336", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592254128529724, "ground_truth": 0}, {"key": "36825153", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7356416693632896, "ground_truth": 0}, {"key": "36825153", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7025300397262131, "ground_truth": 0}, {"key": "36825153", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7446563276569877, "ground_truth": 0}, {"key": "36825153", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743488908479, "ground_truth": 0}, {"key": "36825153", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437592807035, "ground_truth": 0}, {"key": "41050146", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8499711671177658, "ground_truth": 0}, {"key": "41050146", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7704647684373088, "ground_truth": 0}, {"key": "41050146", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7839884710689532, "ground_truth": 0}, {"key": "41050146", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346080622095, "ground_truth": 0}, {"key": "41050146", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.827828166541748, "ground_truth": 0}, {"key": "27865037", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5964331257043862, "ground_truth": 0}, {"key": "27865037", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.36477757104842906, "ground_truth": 0}, {"key": "27865037", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.46295861315939496, "ground_truth": 0}, {"key": "27865037", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.527316518206791, "ground_truth": 0}, {"key": "27865037", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593518968045, "ground_truth": 0}, {"key": "39868565", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8459424432058399, "ground_truth": 0}, {"key": "39868565", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7476159634366019, "ground_truth": 0}, {"key": "39868565", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8509647117696957, "ground_truth": 0}, {"key": "39868565", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672207953966, "ground_truth": 0}, {"key": "39868565", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.789233682859131, "ground_truth": 0}, {"key": "37761968", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.658417489335662, "ground_truth": 0}, {"key": "37761968", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7057850360548149, "ground_truth": 0}, {"key": "37761968", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.775944563331536, "ground_truth": 0}, {"key": "37761968", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118932758088, "ground_truth": 0}, {"key": "37761968", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175293372646, "ground_truth": 0}, {"key": "16326139", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7577943686719285, "ground_truth": 0}, {"key": "16326139", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.760650662529992, "ground_truth": 0}, {"key": "16326139", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7074047038903448, "ground_truth": 0}, {"key": "16326139", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142389328015, "ground_truth": 0}, {"key": "16326139", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646044411902, "ground_truth": 0}, {"key": "36568381", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9136765203051658, "ground_truth": 0}, {"key": "36568381", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511485884036, "ground_truth": 0}, {"key": "36568381", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.910545392404669, "ground_truth": 0}, {"key": "36568381", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288471609046, "ground_truth": 0}, {"key": "36568381", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190633003158338, "ground_truth": 0}, {"key": "39855613", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7866228324347512, "ground_truth": 0}, {"key": "39855613", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8529354756312213, "ground_truth": 0}, {"key": "39855613", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.905322309721348, "ground_truth": 0}, {"key": "39855613", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145769395032, "ground_truth": 0}, {"key": "39855613", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8783142495892511, "ground_truth": 0}, {"key": "29856302", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.618780449485634, "ground_truth": 0}, {"key": "29856302", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6909762945741189, "ground_truth": 0}, {"key": "29856302", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.4804786642003094, "ground_truth": 0}, {"key": "29856302", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.63883529730227, "ground_truth": 0}, {"key": "29856302", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224375718292, "ground_truth": 0}, {"key": "35641106", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7074046990360561, "ground_truth": 0}, {"key": "35641106", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5983121904984263, "ground_truth": 0}, {"key": "35641106", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7090191378235708, "ground_truth": 0}, {"key": "35641106", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321916710995, "ground_truth": 0}, {"key": "35641106", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228767602593, "ground_truth": 0}, {"key": "39474558", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7074047200962358, "ground_truth": 0}, {"key": "39474558", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6352224479463192, "ground_truth": 0}, {"key": "39474558", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6959583369980481, "ground_truth": 0}, {"key": "39474558", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802475521271, "ground_truth": 0}, {"key": "39474558", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549150078263952, "ground_truth": 0}, {"key": "34338135", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9546474246979904, "ground_truth": 0}, {"key": "34338135", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9219218341727271, "ground_truth": 0}, {"key": "34338135", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9403530564584283, "ground_truth": 0}, {"key": "34338135", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9118099580005232, "ground_truth": 0}, {"key": "34338135", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.919642524076801, "ground_truth": 0}, {"key": "35870330", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7057850251727644, "ground_truth": 0}, {"key": "35870330", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8031737943384935, "ground_truth": 0}, {"key": "35870330", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8080672250987445, "ground_truth": 0}, {"key": "35870330", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445614214933, "ground_truth": 0}, {"key": "35870330", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.798186793675371, "ground_truth": 0}, {"key": "24478245", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7853085949081703, "ground_truth": 0}, {"key": "24478245", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7956580979631545, "ground_truth": 0}, {"key": "24478245", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8255897138033125, "ground_truth": 0}, {"key": "24478245", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321832515654, "ground_truth": 0}, {"key": "24478245", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199623651327, "ground_truth": 0}, {"key": "38485946", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7248702787323359, "ground_truth": 0}, {"key": "38485946", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7592253880360839, "ground_truth": 0}, {"key": "38485946", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7534666712184394, "ground_truth": 0}, {"key": "38485946", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197724177764, "ground_truth": 0}, {"key": "38485946", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918378220907, "ground_truth": 0}, {"key": "32509613", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7490872177091398, "ground_truth": 0}, {"key": "32509613", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8267118018451942, "ground_truth": 0}, {"key": "32509613", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7718434662378638, "ground_truth": 0}, {"key": "32509613", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122957010063, "ground_truth": 0}, {"key": "32509613", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879312190216737, "ground_truth": 0}, {"key": "34078819", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8670357633320427, "ground_truth": 0}, {"key": "34078819", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7918210607327985, "ground_truth": 0}, {"key": "34078819", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8499711713230683, "ground_truth": 0}, {"key": "34078819", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867749543452, "ground_truth": 0}, {"key": "34078819", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872224932449, "ground_truth": 0}, {"key": "39523865", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9005297872765281, "ground_truth": 0}, {"key": "39523865", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8757869986248684, "ground_truth": 0}, {"key": "39523865", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8749346166077343, "ground_truth": 0}, {"key": "39523865", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846545086416, "ground_truth": 0}, {"key": "39523865", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145739724874, "ground_truth": 0}, {"key": "33146158", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7233094782763257, "ground_truth": 0}, {"key": "33146158", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7648916200382496, "ground_truth": 0}, {"key": "33146158", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059196298535, "ground_truth": 0}, {"key": "33146158", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297745940686934, "ground_truth": 0}, {"key": "33146158", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102502320542, "ground_truth": 0}, {"key": "32083974", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9066531139874556, "ground_truth": 0}, {"key": "32083974", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8116760436226275, "ground_truth": 0}, {"key": "32083974", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9582261191307274, "ground_truth": 0}, {"key": "32083974", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513793982209, "ground_truth": 0}, {"key": "32083974", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099587540905, "ground_truth": 0}, {"key": "34378482", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9299510433203134, "ground_truth": 0}, {"key": "34378482", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8976953050061884, "ground_truth": 0}, {"key": "34378482", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9339146215751416, "ground_truth": 0}, {"key": "34378482", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8940517143976986, "ground_truth": 0}, {"key": "34378482", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213821600753, "ground_truth": 0}, {"key": "38080102", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7446563479146461, "ground_truth": 0}, {"key": "38080102", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.846957840016015, "ground_truth": 0}, {"key": "38080102", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7826624880369843, "ground_truth": 0}, {"key": "38080102", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.735641636127352, "ground_truth": 0}, {"key": "38080102", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704648011418094, "ground_truth": 0}, {"key": "40244537", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5292633801384354, "ground_truth": 0}, {"key": "40244537", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6187804366628773, "ground_truth": 0}, {"key": "40244537", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.607663204226279, "ground_truth": 0}, {"key": "40244537", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585641923554, "ground_truth": 0}, {"key": "40244537", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802600051238, "ground_truth": 0}, {"key": "33497789", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9588471082361377, "ground_truth": 0}, {"key": "33497789", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9299510381981181, "ground_truth": 0}, {"key": "33497789", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9142907220634764, "ground_truth": 0}, {"key": "33497789", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9190632857311776, "ground_truth": 0}, {"key": "33497789", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037270152205, "ground_truth": 0}, {"key": "28816889", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9539660980636084, "ground_truth": 0}, {"key": "28816889", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9412234470592062, "ground_truth": 0}, {"key": "28816889", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8848377777946468, "ground_truth": 0}, {"key": "28816889", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9149009632478121, "ground_truth": 0}, {"key": "28816889", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849631980765, "ground_truth": 0}, {"key": "38157127", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6706082817410763, "ground_truth": 0}, {"key": "38157127", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7969253776447373, "ground_truth": 0}, {"key": "38157127", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7592253941938635, "ground_truth": 0}, {"key": "38157127", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872294448316, "ground_truth": 0}, {"key": "38157127", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792094887291, "ground_truth": 0}, {"key": "36183569", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7772998686624808, "ground_truth": 0}, {"key": "36183569", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7476159623204015, "ground_truth": 0}, {"key": "36183569", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.816406368690377, "ground_truth": 0}, {"key": "36183569", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786253786612, "ground_truth": 0}, {"key": "36183569", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754380114586, "ground_truth": 0}, {"key": "36012016", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6315942961876877, "ground_truth": 0}, {"key": "36012016", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6442251467316134, "ground_truth": 0}, {"key": "36012016", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6842640215267387, "ground_truth": 0}, {"key": "36012016", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321924891033, "ground_truth": 0}, {"key": "36012016", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256163404459, "ground_truth": 0}, {"key": "34571973", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8080672225778982, "ground_truth": 0}, {"key": "34571973", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8311430643447573, "ground_truth": 0}, {"key": "34571973", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7648916027920447, "ground_truth": 0}, {"key": "34571973", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339546990594, "ground_truth": 0}, {"key": "34571973", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386691037818691, "ground_truth": 0}, {"key": "38707498", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8596637631385078, "ground_truth": 0}, {"key": "38707498", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8864204058483053, "ground_truth": 0}, {"key": "38707498", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8670357684534598, "ground_truth": 0}, {"key": "38707498", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672237598985, "ground_truth": 0}, {"key": "38707498", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936385647892, "ground_truth": 0}, {"key": "35459082", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9124361703888314, "ground_truth": 0}, {"key": "35459082", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9433475759837076, "ground_truth": 0}, {"key": "35459082", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9348724523941664, "ground_truth": 0}, {"key": "35459082", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9324533095602151, "ground_truth": 0}, {"key": "35459082", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9039745100477055, "ground_truth": 0}, {"key": "39464041", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9839708532586325, "ground_truth": 0}, {"key": "39464041", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.980580651314633, "ground_truth": 0}, {"key": "39464041", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9813106923311254, "ground_truth": 0}, {"key": "39464041", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9895109077856229, "ground_truth": 0}, {"key": "39464041", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9902915247123703, "ground_truth": 0}, {"key": "23782052", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7201714941982185, "ground_truth": 0}, {"key": "23782052", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8428631542448551, "ground_truth": 0}, {"key": "23782052", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8998277790517437, "ground_truth": 0}, {"key": "23782052", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063832853351, "ground_truth": 0}, {"key": "23782052", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430467399706, "ground_truth": 0}, {"key": "36568455", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7620700947205522, "ground_truth": 0}, {"key": "36568455", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8397339716868747, "ground_truth": 0}, {"key": "36568455", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7732163625687662, "ground_truth": 0}, {"key": "36568455", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879311932511031, "ground_truth": 0}, {"key": "36568455", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036193681288, "ground_truth": 0}, {"key": "38469552", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9167080729600809, "ground_truth": 0}, {"key": "38469552", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9066531297827777, "ground_truth": 0}, {"key": "38469552", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8697145779123429, "ground_truth": 0}, {"key": "38469552", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9079671467093282, "ground_truth": 0}, {"key": "38469552", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.925768625406041, "ground_truth": 0}, {"key": "35922277", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8757870051109499, "ground_truth": 0}, {"key": "35922277", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8757869898887555, "ground_truth": 0}, {"key": "35922277", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8459424369034546, "ground_truth": 0}, {"key": "35922277", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797652008227, "ground_truth": 0}, {"key": "35922277", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517077730914, "ground_truth": 0}, {"key": "32744293", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.729519769888007, "ground_truth": 0}, {"key": "32744293", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7201715182735301, "ground_truth": 0}, {"key": "32744293", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6654105525194206, "ground_truth": 0}, {"key": "32744293", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620700993423516, "ground_truth": 0}, {"key": "32744293", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526149781811, "ground_truth": 0}, {"key": "30972362", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.81757447940109, "ground_truth": 0}, {"key": "30972362", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8832359887645265, "ground_truth": 0}, {"key": "30972362", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9046505397198887, "ground_truth": 0}, {"key": "30972362", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9190632897465437, "ground_truth": 0}, {"key": "30972362", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9246876958128635, "ground_truth": 0}, {"key": "36380943", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6909762669057927, "ground_truth": 0}, {"key": "36380943", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8289388204337121, "ground_truth": 0}, {"key": "36380943", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7279754632544323, "ground_truth": 0}, {"key": "36380943", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759697139901, "ground_truth": 0}, {"key": "36380943", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837910441309, "ground_truth": 0}, {"key": "36929355", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7057850262330498, "ground_truth": 0}, {"key": "36929355", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6169358256298902, "ground_truth": 0}, {"key": "36929355", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7041601485233727, "ground_truth": 0}, {"key": "36929355", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289387893675652, "ground_truth": 0}, {"key": "36929355", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.705785031329353, "ground_truth": 0}, {"key": "39127206", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.68594945341759, "ground_truth": 0}, {"key": "39127206", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5273165237845331, "ground_truth": 0}, {"key": "39127206", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.544801407208773, "ground_truth": 0}, {"key": "39127206", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416442646444, "ground_truth": 0}, {"key": "39127206", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786038710651, "ground_truth": 0}, {"key": "36128318", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.791821054081343, "ground_truth": 0}, {"key": "36128318", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.79182107529303, "ground_truth": 0}, {"key": "36128318", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7866228303790093, "ground_truth": 0}, {"key": "36128318", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423129332878, "ground_truth": 0}, {"key": "36128318", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256005133433, "ground_truth": 0}, {"key": "39863480", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9059898207572621, "ground_truth": 0}, {"key": "39863480", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9130583395586522, "ground_truth": 0}, {"key": "39863480", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9309620667948605, "ground_truth": 0}, {"key": "39863480", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278537171444, "ground_truth": 0}, {"key": "39863480", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357664896768, "ground_truth": 0}, {"key": "38634057", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9334308161515302, "ground_truth": 0}, {"key": "38634057", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9433475733770484, "ground_truth": 0}, {"key": "38634057", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.961243803068561, "ground_truth": 0}, {"key": "38634057", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9433475711815944, "ground_truth": 0}, {"key": "38634057", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9105453992472236, "ground_truth": 0}, {"key": "33131935", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9263037193501295, "ground_truth": 0}, {"key": "33131935", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9489172635960376, "ground_truth": 0}, {"key": "33131935", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9086178982435708, "ground_truth": 0}, {"key": "33131935", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681096439042, "ground_truth": 0}, {"key": "33131935", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9358173591790083, "ground_truth": 0}, {"key": "39021319", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8152324987725288, "ground_truth": 0}, {"key": "39021319", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.721743191437577, "ground_truth": 0}, {"key": "39021319", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8140528037984188, "ground_truth": 0}, {"key": "39021319", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283917332884, "ground_truth": 0}, {"key": "39021319", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118880517153, "ground_truth": 0}, {"key": "40644571", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6842640385554588, "ground_truth": 0}, {"key": "40644571", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.505859110683944, "ground_truth": 0}, {"key": "40644571", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.575588010103279, "ground_truth": 0}, {"key": "40644571", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723317085383722, "ground_truth": 0}, {"key": "40644571", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370308164936238, "ground_truth": 0}, {"key": "14681877", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9136765232269035, "ground_truth": 0}, {"key": "14681877", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8940517135557678, "ground_truth": 0}, {"key": "14681877", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8548846446016166, "ground_truth": 0}, {"key": "14681877", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872046033649873, "ground_truth": 0}, {"key": "14681877", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765297728747, "ground_truth": 0}, {"key": "36570890", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.710628290611894, "ground_truth": 0}, {"key": "36570890", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7185943998869511, "ground_truth": 0}, {"key": "36570890", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6113819882644567, "ground_truth": 0}, {"key": "36570890", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762908526116, "ground_truth": 0}, {"key": "36570890", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998642506603, "ground_truth": 0}, {"key": "30452755", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9012274150864524, "ground_truth": 0}, {"key": "30452755", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9111797057643041, "ground_truth": 0}, {"key": "30452755", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8459424416879876, "ground_truth": 0}, {"key": "30452755", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767804079151, "ground_truth": 0}, {"key": "30452755", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869844795564, "ground_truth": 0}, {"key": "37347053", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6460136958615343, "ground_truth": 0}, {"key": "37347053", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6584174847969986, "ground_truth": 0}, {"key": "37347053", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898656830666, "ground_truth": 0}, {"key": "37347053", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269687222437, "ground_truth": 0}, {"key": "37347053", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122322114877981, "ground_truth": 0}, {"key": "38890979", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.732591844623965, "ground_truth": 0}, {"key": "38890979", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7431679993950644, "ground_truth": 0}, {"key": "38890979", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.715424003945009, "ground_truth": 0}, {"key": "38890979", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.684264029777164, "ground_truth": 0}, {"key": "38890979", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918453943606, "ground_truth": 0}, {"key": "32974694", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8386797549452084, "ground_truth": 0}, {"key": "32974694", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.883235985554862, "ground_truth": 0}, {"key": "32974694", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8354835346217145, "ground_truth": 0}, {"key": "32974694", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9230391625487068, "ground_truth": 0}, {"key": "32974694", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849651227043, "ground_truth": 0}, {"key": "38519940", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9167080751585301, "ground_truth": 0}, {"key": "38519940", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.934395163699353, "ground_truth": 0}, {"key": "38519940", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9532750415835386, "ground_truth": 0}, {"key": "38519940", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9529258221224931, "ground_truth": 0}, {"key": "38519940", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9515039971627052, "ground_truth": 0}, {"key": "38870104", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.884039286002206, "ground_truth": 0}, {"key": "38870104", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.885631478343046, "ground_truth": 0}, {"key": "38870104", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.790530308054754, "ground_truth": 0}, {"key": "38870104", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509647178629413, "ground_truth": 0}, {"key": "38870104", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972595343727, "ground_truth": 0}, {"key": "34283161", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6513548761869017, "ground_truth": 0}, {"key": "34283161", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.737158158435119, "ground_truth": 0}, {"key": "34283161", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5544704884326986, "ground_truth": 0}, {"key": "34283161", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581887105308, "ground_truth": 0}, {"key": "34283161", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666289396718, "ground_truth": 0}, {"key": "31650463", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7170119019179287, "ground_truth": 0}, {"key": "31650463", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8300437765401888, "ground_truth": 0}, {"key": "31650463", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7813306179309838, "ground_truth": 0}, {"key": "31650463", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210666134374, "ground_truth": 0}, {"key": "31650463", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744911288787, "ground_truth": 0}, {"key": "35589432", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8244619344781297, "ground_truth": 0}, {"key": "35589432", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.795658104406413, "ground_truth": 0}, {"key": "35589432", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7799928791660783, "ground_truth": 0}, {"key": "35589432", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.856812291955113, "ground_truth": 0}, {"key": "35589432", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640163097767, "ground_truth": 0}, {"key": "14412752", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7866228379415, "ground_truth": 0}, {"key": "14412752", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8116760209610163, "ground_truth": 0}, {"key": "14412752", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7505527715037218, "ground_truth": 0}, {"key": "14412752", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506448793825, "ground_truth": 0}, {"key": "14412752", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367821925544, "ground_truth": 0}, {"key": "37271183", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9496693693865987, "ground_truth": 0}, {"key": "37271183", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9553191313547531, "ground_truth": 0}, {"key": "37271183", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9635062323857502, "ground_truth": 0}, {"key": "37271183", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9445872098167434, "ground_truth": 0}, {"key": "37271183", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9572778027738015, "ground_truth": 0}, {"key": "35588153", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9039745120837209, "ground_truth": 0}, {"key": "35588153", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9202179816750493, "ground_truth": 0}, {"key": "35588153", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9563089418020339, "ground_truth": 0}, {"key": "35588153", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9073122220533216, "ground_truth": 0}, {"key": "35588153", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9358173577013214, "ground_truth": 0}, {"key": "39876692", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7759445431293603, "ground_truth": 0}, {"key": "39876692", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7634837637293687, "ground_truth": 0}, {"key": "39876692", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7549149776893695, "ground_truth": 0}, {"key": "39876692", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689435643799, "ground_truth": 0}, {"key": "39876692", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786929703573, "ground_truth": 0}, {"key": "38992323", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8333246029012831, "ground_truth": 0}, {"key": "38992323", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7233094642593708, "ground_truth": 0}, {"key": "38992323", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8365545455980462, "ground_truth": 0}, {"key": "38992323", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916260346603, "ground_truth": 0}, {"key": "38992323", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389957313358, "ground_truth": 0}, {"key": "37556002", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6825737479045043, "ground_truth": 0}, {"key": "37556002", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5506073542691298, "ground_truth": 0}, {"key": "37556002", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8289388111225467, "ground_truth": 0}, {"key": "37556002", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740232564326, "ground_truth": 0}, {"key": "37556002", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.735641642168841, "ground_truth": 0}, {"key": "39875801", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9079671350238662, "ground_truth": 0}, {"key": "39875801", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9230391685255539, "ground_truth": 0}, {"key": "39875801", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9263037277580736, "ground_truth": 0}, {"key": "39875801", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149071483698, "ground_truth": 0}, {"key": "39875801", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9167080797561505, "ground_truth": 0}, {"key": "39272285", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5097643890543633, "ground_truth": 0}, {"key": "39272285", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.3593641426351203, "ground_truth": 0}, {"key": "39272285", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.44360040921297617, "ground_truth": 0}, {"key": "39272285", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4474602900673558, "ground_truth": 0}, {"key": "39272285", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526455697884, "ground_truth": 0}, {"key": "39629714", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7577943750431185, "ground_truth": 0}, {"key": "39629714", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7217432041144676, "ground_truth": 0}, {"key": "39629714", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5428632712154542, "ground_truth": 0}, {"key": "39629714", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419879063954, "ground_truth": 0}, {"key": "39629714", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118945878393, "ground_truth": 0}, {"key": "34043257", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8344068860015829, "ground_truth": 0}, {"key": "34043257", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8210441086104767, "ground_truth": 0}, {"key": "34043257", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631330594846, "ground_truth": 0}, {"key": "34043257", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359813532059, "ground_truth": 0}, {"key": "34043257", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825906345372, "ground_truth": 0}, {"key": "33995240", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5563995669489464, "ground_truth": 0}, {"key": "33995240", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7279754539433759, "ground_truth": 0}, {"key": "33995240", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6495786088749436, "ground_truth": 0}, {"key": "33995240", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206215988745796, "ground_truth": 0}, {"key": "33995240", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213283797766, "ground_truth": 0}, {"key": "39399948", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.951142223318105, "ground_truth": 0}, {"key": "39399948", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9518632322945402, "ground_truth": 0}, {"key": "39399948", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8887587845946385, "ground_truth": 0}, {"key": "39399948", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9453993968707369, "ground_truth": 0}, {"key": "39399948", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8887587942502505, "ground_truth": 0}, {"key": "33185890", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7732164062302918, "ground_truth": 0}, {"key": "33185890", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7248702913384316, "ground_truth": 0}, {"key": "33185890", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8104789009196861, "ground_truth": 0}, {"key": "33185890", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527498058627, "ground_truth": 0}, {"key": "33185890", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082760549844, "ground_truth": 0}, {"key": "35280425", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8615382069120642, "ground_truth": 0}, {"key": "35280425", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7718434909005535, "ground_truth": 0}, {"key": "35280425", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059311306511, "ground_truth": 0}, {"key": "35280425", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757870024380928, "ground_truth": 0}, {"key": "35280425", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283899813849, "ground_truth": 0}, {"key": "16365170", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9173026624284055, "ground_truth": 0}, {"key": "16365170", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.920217988059391, "ground_truth": 0}, {"key": "16365170", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8596637466063616, "ground_truth": 0}, {"key": "16365170", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256520461695, "ground_truth": 0}, {"key": "16365170", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281489362415, "ground_truth": 0}, {"key": "24388238", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6926419804709603, "ground_truth": 0}, {"key": "24388238", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7264256011245093, "ground_truth": 0}, {"key": "24388238", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8152324854873023, "ground_truth": 0}, {"key": "24388238", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085808425067, "ground_truth": 0}, {"key": "24388238", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916129880785, "ground_truth": 0}, {"key": "35024827", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8044059163708703, "ground_truth": 0}, {"key": "35024827", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7786493191154307, "ground_truth": 0}, {"key": "35024827", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8459424447615788, "ground_truth": 0}, {"key": "35024827", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307685527314, "ground_truth": 0}, {"key": "35024827", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544274653459, "ground_truth": 0}, {"key": "38624944", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8333246006364641, "ground_truth": 0}, {"key": "38624944", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8164063781135343, "ground_truth": 0}, {"key": "38624944", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8233284006662688, "ground_truth": 0}, {"key": "38624944", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833903386892, "ground_truth": 0}, {"key": "38624944", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737988302274, "ground_truth": 0}, {"key": "34719830", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8278281510680696, "ground_truth": 0}, {"key": "34719830", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8568123008738289, "ground_truth": 0}, {"key": "34719830", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7170118684312696, "ground_truth": 0}, {"key": "34719830", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047117146747, "ground_truth": 0}, {"key": "34719830", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884710767625, "ground_truth": 0}, {"key": "38995225", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8984105556185905, "ground_truth": 0}, {"key": "38995225", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9230391603894551, "ground_truth": 0}, {"key": "38995225", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8774767802734098, "ground_truth": 0}, {"key": "38995225", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361644493089, "ground_truth": 0}, {"key": "38995225", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.864310456157068, "ground_truth": 0}, {"key": "34242311", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8643104584823833, "ground_truth": 0}, {"key": "34242311", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6706082811038064, "ground_truth": 0}, {"key": "34242311", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.804405921310963, "ground_truth": 0}, {"key": "34242311", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799929015887324, "ground_truth": 0}, {"key": "34242311", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748565546375, "ground_truth": 0}, {"key": "39253748", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9706877694499495, "ground_truth": 0}, {"key": "39253748", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9469902273148854, "ground_truth": 0}, {"key": "39253748", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9522199326630207, "ground_truth": 0}, {"key": "39253748", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9496693672685804, "ground_truth": 0}, {"key": "39253748", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9640516784714406, "ground_truth": 0}, {"key": "37131104", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9926541738315728, "ground_truth": 0}, {"key": "37131104", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9949788502598809, "ground_truth": 0}, {"key": "37131104", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9908034475089191, "ground_truth": 0}, {"key": "37131104", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9890976280184363, "ground_truth": 0}, {"key": "37131104", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9920002452547122, "ground_truth": 0}, {"key": "38490554", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8278281512453423, "ground_truth": 0}, {"key": "38490554", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7866228317114318, "ground_truth": 0}, {"key": "38490554", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8187368085447678, "ground_truth": 0}, {"key": "38490554", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675359425454, "ground_truth": 0}, {"key": "38490554", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204006065608, "ground_truth": 0}, {"key": "29009500", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.769080231623766, "ground_truth": 0}, {"key": "29009500", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6442251034544364, "ground_truth": 0}, {"key": "29009500", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8152324832313872, "ground_truth": 0}, {"key": "29009500", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.585101168188897, "ground_truth": 0}, {"key": "29009500", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883566266758, "ground_truth": 0}, {"key": "36703057", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8539127463623456, "ground_truth": 0}, {"key": "36703057", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8459424542533934, "ground_truth": 0}, {"key": "36703057", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.838679761778763, "ground_truth": 0}, {"key": "36703057", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.891054952906965, "ground_truth": 0}, {"key": "36703057", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424443296982, "ground_truth": 0}, {"key": "34876987", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9736446472113548, "ground_truth": 0}, {"key": "34876987", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9609517039364486, "ground_truth": 0}, {"key": "34876987", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9556514180895381, "ground_truth": 0}, {"key": "34876987", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9441768601355846, "ground_truth": 0}, {"key": "34876987", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9465966679653028, "ground_truth": 0}, {"key": "36209258", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8365545711703267, "ground_truth": 0}, {"key": "36209258", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9005297929838062, "ground_truth": 0}, {"key": "36209258", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8679338469457079, "ground_truth": 0}, {"key": "36209258", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106283246644293, "ground_truth": 0}, {"key": "36209258", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936526734788, "ground_truth": 0}, {"key": "36854437", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6206216078666633, "ground_truth": 0}, {"key": "36854437", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5983121804688583, "ground_truth": 0}, {"key": "36854437", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.46879061409143574, "ground_truth": 0}, {"key": "36854437", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4016877759280589, "ground_truth": 0}, {"key": "36854437", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.519521330330104, "ground_truth": 0}, {"key": "38047723", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7648916096823902, "ground_truth": 0}, {"key": "38047723", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7505527686907706, "ground_truth": 0}, {"key": "38047723", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6020616164318185, "ground_truth": 0}, {"key": "38047723", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299926046374, "ground_truth": 0}, {"key": "38047723", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228276039863, "ground_truth": 0}, {"key": "34287816", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6076631889326161, "ground_truth": 0}, {"key": "34287816", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.695958303040813, "ground_truth": 0}, {"key": "34287816", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7106283114718657, "ground_truth": 0}, {"key": "34287816", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504877694795, "ground_truth": 0}, {"key": "34287816", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995870993881, "ground_truth": 0}, {"key": "33235855", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9263037373412945, "ground_truth": 0}, {"key": "33235855", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9433475700749083, "ground_truth": 0}, {"key": "33235855", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9546474180853173, "ground_truth": 0}, {"key": "33235855", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9367494705845645, "ground_truth": 0}, {"key": "33235855", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.925229958070042, "ground_truth": 0}, {"key": "34381016", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7732163708622832, "ground_truth": 0}, {"key": "34381016", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8210441007300765, "ground_truth": 0}, {"key": "34381016", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8365545605647414, "ground_truth": 0}, {"key": "34381016", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122923820761, "ground_truth": 0}, {"key": "34381016", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526165477135, "ground_truth": 0}, {"key": "28064995", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8221891381694955, "ground_truth": 0}, {"key": "28064995", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8670357664800892, "ground_truth": 0}, {"key": "28064995", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6976089162587452, "ground_truth": 0}, {"key": "28064995", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549150028005751, "ground_truth": 0}, {"key": "28064995", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441186536628, "ground_truth": 0}, {"key": "37576197", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5755880295550686, "ground_truth": 0}, {"key": "37576197", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5058591116437304, "ground_truth": 0}, {"key": "37576197", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6206216413811015, "ground_truth": 0}, {"key": "37576197", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746092493184, "ground_truth": 0}, {"key": "37576197", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011607794494, "ground_truth": 0}, {"key": "34454741", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.480478683711542, "ground_truth": 0}, {"key": "34454741", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4902356191090024, "ground_truth": 0}, {"key": "34454741", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6424324632501642, "ground_truth": 0}, {"key": "34454741", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.573678382615808, "ground_truth": 0}, {"key": "34454741", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324730554419, "ground_truth": 0}, {"key": "34766970", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7295197902088351, "ground_truth": 0}, {"key": "34766970", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6279511990504647, "ground_truth": 0}, {"key": "34766970", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.718594391690163, "ground_truth": 0}, {"key": "34766970", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191241316385, "ground_truth": 0}, {"key": "34766970", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224175000952, "ground_truth": 0}, {"key": "35574186", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8872045887356036, "ground_truth": 0}, {"key": "35574186", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8255897226399418, "ground_truth": 0}, {"key": "35574186", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8955226804834713, "ground_truth": 0}, {"key": "35574186", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748637412443, "ground_truth": 0}, {"key": "35574186", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8925625205098463, "ground_truth": 0}, {"key": "35486470", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.750552742155718, "ground_truth": 0}, {"key": "35486470", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6893056061275941, "ground_truth": 0}, {"key": "35486470", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7534666529505849, "ground_truth": 0}, {"key": "35486470", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089166223173, "ground_truth": 0}, {"key": "35486470", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102708531756, "ground_truth": 0}, {"key": "40977702", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6976089259310482, "ground_truth": 0}, {"key": "40977702", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6757646098222788, "ground_truth": 0}, {"key": "40977702", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6601723636687947, "ground_truth": 0}, {"key": "40977702", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601283830289, "ground_truth": 0}, {"key": "40977702", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671477105298358, "ground_truth": 0}, {"key": "35336618", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6531269161501617, "ground_truth": 0}, {"key": "35336618", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7264256054021705, "ground_truth": 0}, {"key": "35336618", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7534666455515615, "ground_truth": 0}, {"key": "35336618", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424325168047473, "ground_truth": 0}, {"key": "35336618", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916170887721, "ground_truth": 0}, {"key": "33024679", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.796925372798806, "ground_truth": 0}, {"key": "33024679", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.713830745766604, "ground_truth": 0}, {"key": "33024679", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8816149092002088, "ground_truth": 0}, {"key": "33024679", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434999010897, "ground_truth": 0}, {"key": "33024679", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210440944449037, "ground_truth": 0}, {"key": "37451334", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.767689855778328, "ground_truth": 0}, {"key": "37451334", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7248702707538994, "ground_truth": 0}, {"key": "37451334", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7476159821928132, "ground_truth": 0}, {"key": "37451334", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493286920471, "ground_truth": 0}, {"key": "37451334", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.832236655170665, "ground_truth": 0}, {"key": "33354824", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.45519863141928846, "ground_truth": 0}, {"key": "33354824", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4205996200183866, "ground_truth": 0}, {"key": "33354824", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.420599570388077, "ground_truth": 0}, {"key": "33354824", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.523420375234129, "ground_truth": 0}, {"key": "33354824", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.564098490804044, "ground_truth": 0}, {"key": "34688538", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8766343796162022, "ground_truth": 0}, {"key": "34688538", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8233283805374872, "ground_truth": 0}, {"key": "34688538", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8697145853026322, "ground_truth": 0}, {"key": "34688538", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.874934628414046, "ground_truth": 0}, {"key": "34688538", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199701858371, "ground_truth": 0}, {"key": "33646276", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6424324910826367, "ground_truth": 0}, {"key": "33646276", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6352224380155588, "ground_truth": 0}, {"key": "33646276", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6671476665752744, "ground_truth": 0}, {"key": "33646276", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074046809616225, "ground_truth": 0}, {"key": "33646276", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317039574351, "ground_truth": 0}, {"key": "40322608", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9184802524990541, "ground_truth": 0}, {"key": "40322608", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.898410542625706, "ground_truth": 0}, {"key": "40322608", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9257686259528425, "ground_truth": 0}, {"key": "40322608", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869780157076, "ground_truth": 0}, {"key": "40322608", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.928408793296935, "ground_truth": 0}, {"key": "39565762", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7446563472775685, "ground_truth": 0}, {"key": "39565762", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8267117842571671, "ground_truth": 0}, {"key": "39565762", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6388352849789468, "ground_truth": 0}, {"key": "39565762", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159642630875, "ground_truth": 0}, {"key": "39565762", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690616186257, "ground_truth": 0}, {"key": "30534259", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7490872046958693, "ground_truth": 0}, {"key": "30534259", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7217432108421116, "ground_truth": 0}, {"key": "30534259", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7356416422160152, "ground_truth": 0}, {"key": "30534259", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876300219944012, "ground_truth": 0}, {"key": "30534259", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365706035722, "ground_truth": 0}, {"key": "39644242", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8469578339998873, "ground_truth": 0}, {"key": "39644242", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8519528168150189, "ground_truth": 0}, {"key": "39644242", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8633916172997076, "ground_truth": 0}, {"key": "39644242", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849634677707, "ground_truth": 0}, {"key": "39644242", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300783977938, "ground_truth": 0}, {"key": "19853740", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6926419895346728, "ground_truth": 0}, {"key": "19853740", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624812151274, "ground_truth": 0}, {"key": "19853740", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7866228105141027, "ground_truth": 0}, {"key": "19853740", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199634374503, "ground_truth": 0}, {"key": "19853740", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366523533268, "ground_truth": 0}, {"key": "33023078", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8783142387562397, "ground_truth": 0}, {"key": "33023078", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8068526338929632, "ground_truth": 0}, {"key": "33023078", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8568122989314547, "ground_truth": 0}, {"key": "33023078", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357643455673, "ground_truth": 0}, {"key": "33023078", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117803059582, "ground_truth": 0}, {"key": "38329806", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6893056152076129, "ground_truth": 0}, {"key": "38329806", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7041601535210082, "ground_truth": 0}, {"key": "38329806", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.675764620579946, "ground_truth": 0}, {"key": "38329806", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581687527419, "ground_truth": 0}, {"key": "38329806", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149854733831, "ground_truth": 0}, {"key": "38761942", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7520125573470836, "ground_truth": 0}, {"key": "38761942", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8568123009503263, "ground_truth": 0}, {"key": "38761942", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8438951002570461, "ground_truth": 0}, {"key": "38761942", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8879840388101408, "ground_truth": 0}, {"key": "38761942", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386691065492268, "ground_truth": 0}, {"key": "33773576", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.620621613737067, "ground_truth": 0}, {"key": "33773576", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6601723961204807, "ground_truth": 0}, {"key": "33773576", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5717665881847316, "ground_truth": 0}, {"key": "33773576", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185169409545, "ground_truth": 0}, {"key": "33773576", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.793105960474179, "ground_truth": 0}, {"key": "37642631", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6169358410998639, "ground_truth": 0}, {"key": "37642631", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7279754631823055, "ground_truth": 0}, {"key": "37642631", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.665410574990555, "ground_truth": 0}, {"key": "37642631", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442250988191157, "ground_truth": 0}, {"key": "37642631", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494577094283, "ground_truth": 0}, {"key": "36609836", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8244619280139114, "ground_truth": 0}, {"key": "36609836", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7704647809685569, "ground_truth": 0}, {"key": "36609836", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9329437083038459, "ground_truth": 0}, {"key": "36609836", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127428957459, "ground_truth": 0}, {"key": "36609836", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233284027299844, "ground_truth": 0}, {"key": "41035610", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7956580944593665, "ground_truth": 0}, {"key": "41035610", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6825737567433597, "ground_truth": 0}, {"key": "41035610", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6943026710156996, "ground_truth": 0}, {"key": "41035610", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493175625427, "ground_truth": 0}, {"key": "41035610", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059542563071, "ground_truth": 0}, {"key": "37592684", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6584174955122842, "ground_truth": 0}, {"key": "37592684", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7866228270675021, "ground_truth": 0}, {"key": "37592684", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7606506705651167, "ground_truth": 0}, {"key": "37592684", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059366457499, "ground_truth": 0}, {"key": "37592684", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8688267824638952, "ground_truth": 0}, {"key": "38951040", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8104789061721797, "ground_truth": 0}, {"key": "38951040", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6548947268829474, "ground_truth": 0}, {"key": "38951040", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7704647542240863, "ground_truth": 0}, {"key": "38951040", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933453926247, "ground_truth": 0}, {"key": "38951040", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920076822295, "ground_truth": 0}, {"key": "40774469", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5486734973282504, "ground_truth": 0}, {"key": "40774469", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5660185160144594, "ground_truth": 0}, {"key": "40774469", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6791786800404024, "ground_truth": 0}, {"key": "40774469", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.684264054581307, "ground_truth": 0}, {"key": "40774469", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916239884371, "ground_truth": 0}, {"key": "40876288", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8449215204690427, "ground_truth": 0}, {"key": "40876288", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8019358148520659, "ground_truth": 0}, {"key": "40876288", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7799928842592705, "ground_truth": 0}, {"key": "40876288", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808785958496554, "ground_truth": 0}, {"key": "40876288", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689350171874, "ground_truth": 0}, {"key": "40340131", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8749346202886593, "ground_truth": 0}, {"key": "40340131", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8300437709499531, "ground_truth": 0}, {"key": "40340131", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8289388251843488, "ground_truth": 0}, {"key": "40340131", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321801789156, "ground_truth": 0}, {"key": "40340131", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163585115444, "ground_truth": 0}, {"key": "30121591", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7341195318354434, "ground_truth": 0}, {"key": "30121591", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7461390138862103, "ground_truth": 0}, {"key": "30121591", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7057850372402635, "ground_truth": 0}, {"key": "30121591", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339617658589, "ground_truth": 0}, {"key": "30121591", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493067333855, "ground_truth": 0}, {"key": "35623366", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8688267751731645, "ground_truth": 0}, {"key": "35623366", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7759445552421408, "ground_truth": 0}, {"key": "35623366", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8740772271867757, "ground_truth": 0}, {"key": "35623366", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936280603361, "ground_truth": 0}, {"key": "35623366", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799928967612144, "ground_truth": 0}, {"key": "41014093", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8661325122067381, "ground_truth": 0}, {"key": "41014093", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8019358219306989, "ground_truth": 0}, {"key": "41014093", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8509646947923443, "ground_truth": 0}, {"key": "41014093", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998608451461, "ground_truth": 0}, {"key": "41014093", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357525054184, "ground_truth": 0}, {"key": "11387984", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6959583329358358, "ground_truth": 0}, {"key": "11387984", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7505527533562217, "ground_truth": 0}, {"key": "11387984", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.834406894463661, "ground_truth": 0}, {"key": "11387984", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526224469759, "ground_truth": 0}, {"key": "11387984", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578303715026, "ground_truth": 0}, {"key": "39508312", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7185943836437181, "ground_truth": 0}, {"key": "39508312", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8289388130292141, "ground_truth": 0}, {"key": "39508312", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7662936492964372, "ground_truth": 0}, {"key": "39508312", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.804405918250776, "ground_truth": 0}, {"key": "39508312", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582767224967, "ground_truth": 0}, {"key": "35815369", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8255897234348356, "ground_truth": 0}, {"key": "35815369", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8187367830528475, "ground_truth": 0}, {"key": "35815369", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8848377725588925, "ground_truth": 0}, {"key": "35815369", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681007827085, "ground_truth": 0}, {"key": "35815369", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673335086758, "ground_truth": 0}, {"key": "35802823", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7170119020814433, "ground_truth": 0}, {"key": "35802823", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8910549605835848, "ground_truth": 0}, {"key": "35802823", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8799743801734915, "ground_truth": 0}, {"key": "35802823", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493139908905, "ground_truth": 0}, {"key": "35802823", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.874934614857099, "ground_truth": 0}, {"key": "38499968", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7981867873706511, "ground_truth": 0}, {"key": "38499968", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7563575777944037, "ground_truth": 0}, {"key": "38499968", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8469578511520681, "ground_truth": 0}, {"key": "38499968", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943770012179, "ground_truth": 0}, {"key": "38499968", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802601538387, "ground_truth": 0}, {"key": "36926726", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7905303261213984, "ground_truth": 0}, {"key": "36926726", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8278281546264191, "ground_truth": 0}, {"key": "36926726", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7279754228334884, "ground_truth": 0}, {"key": "36926726", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068670211858, "ground_truth": 0}, {"key": "36926726", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825870350983, "ground_truth": 0}, {"key": "40903712", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7704647825079283, "ground_truth": 0}, {"key": "40903712", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7634837725071133, "ground_truth": 0}, {"key": "40903712", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7185943772330811, "ground_truth": 0}, {"key": "40903712", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898409022828, "ground_truth": 0}, {"key": "40903712", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.787931190180124, "ground_truth": 0}, {"key": "19614862", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6842640157868386, "ground_truth": 0}, {"key": "19614862", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4707365892398216, "ground_truth": 0}, {"key": "19614862", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7217431936704461, "ground_truth": 0}, {"key": "19614862", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646146347704, "ground_truth": 0}, {"key": "19614862", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "38861704", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7563575436864786, "ground_truth": 0}, {"key": "38861704", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5679366000626462, "ground_truth": 0}, {"key": "38861704", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7759445704806625, "ground_truth": 0}, {"key": "38861704", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.638835273754583, "ground_truth": 0}, {"key": "38861704", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876299987444304, "ground_truth": 0}, {"key": "34349607", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6513548905633054, "ground_truth": 0}, {"key": "34349607", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5621765057842489, "ground_truth": 0}, {"key": "34349607", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6039318385831958, "ground_truth": 0}, {"key": "34349607", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762712443812, "ground_truth": 0}, {"key": "34349607", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082594865074, "ground_truth": 0}, {"key": "20773800", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.4902356251574435, "ground_truth": 0}, {"key": "20773800", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4244120013545452, "ground_truth": 0}, {"key": "20773800", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.3793783924403449, "ground_truth": 0}, {"key": "20773800", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4746311675204434, "ground_truth": 0}, {"key": "20773800", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.3849121409763222, "ground_truth": 0}, {"key": "35545608", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6876299852068228, "ground_truth": 0}, {"key": "35545608", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5467381785951664, "ground_truth": 0}, {"key": "35545608", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5869964330512352, "ground_truth": 0}, {"key": "35545608", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413710600059, "ground_truth": 0}, {"key": "35545608", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504991898753, "ground_truth": 0}, {"key": "37258984", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6740504647826078, "ground_truth": 0}, {"key": "37258984", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6688802605755487, "ground_truth": 0}, {"key": "37258984", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6057990616801573, "ground_truth": 0}, {"key": "37258984", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154240072900382, "ground_truth": 0}, {"key": "37258984", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702832029421, "ground_truth": 0}, {"key": "37274562", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8255897321992283, "ground_truth": 0}, {"key": "37274562", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7341195415773674, "ground_truth": 0}, {"key": "37274562", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.816406388560363, "ground_truth": 0}, {"key": "37274562", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423402639549, "ground_truth": 0}, {"key": "37274562", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493369410273, "ground_truth": 0}, {"key": "40828068", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.913676524661023, "ground_truth": 0}, {"key": "40828068", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.917302659242326, "ground_truth": 0}, {"key": "40828068", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8289388074912638, "ground_truth": 0}, {"key": "40828068", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142421121725, "ground_truth": 0}, {"key": "40828068", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531129441416, "ground_truth": 0}, {"key": "37807180", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9294404009068615, "ground_truth": 0}, {"key": "37807180", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9437636511810182, "ground_truth": 0}, {"key": "37807180", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9458012719416304, "ground_truth": 0}, {"key": "37807180", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9504109734062797, "ground_truth": 0}, {"key": "37807180", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9445872046790011, "ground_truth": 0}, {"key": "40748607", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9485372336500146, "ground_truth": 0}, {"key": "40748607", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9539661019481073, "ground_truth": 0}, {"key": "40748607", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9515039998941417, "ground_truth": 0}, {"key": "40748607", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9678992910240225, "ground_truth": 0}, {"key": "40748607", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9539661012129413, "ground_truth": 0}, {"key": "40123819", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9263037277147511, "ground_truth": 0}, {"key": "40123819", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.847967756682549, "ground_truth": 0}, {"key": "40123819", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9046505433098192, "ground_truth": 0}, {"key": "40123819", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314768679392, "ground_truth": 0}, {"key": "40123819", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585829228679, "ground_truth": 0}, {"key": "38453867", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7943849616195844, "ground_truth": 0}, {"key": "38453867", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8267117847948987, "ground_truth": 0}, {"key": "38453867", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7732163888905796, "ground_truth": 0}, {"key": "38453867", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677612489288, "ground_truth": 0}, {"key": "38453867", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8661325091459375, "ground_truth": 0}, {"key": "38944856", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9314625123207494, "ground_truth": 0}, {"key": "38944856", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9213576196282782, "ground_truth": 0}, {"key": "38944856", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8824278677596259, "ground_truth": 0}, {"key": "38944856", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9407897537261359, "ground_truth": 0}, {"key": "38944856", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675447342065, "ground_truth": 0}, {"key": "35778898", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9086179009638075, "ground_truth": 0}, {"key": "35778898", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8955226824084938, "ground_truth": 0}, {"key": "35778898", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8006919848147662, "ground_truth": 0}, {"key": "35778898", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743713427295, "ground_truth": 0}, {"key": "35778898", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.926835276552149, "ground_truth": 0}, {"key": "32530125", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6548947292279249, "ground_truth": 0}, {"key": "32530125", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6370307897574513, "ground_truth": 0}, {"key": "32530125", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5832033539058826, "ground_truth": 0}, {"key": "32530125", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.753466657641654, "ground_truth": 0}, {"key": "32530125", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582745484927, "ground_truth": 0}, {"key": "35010363", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.677474040170379, "ground_truth": 0}, {"key": "35010363", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6020615938243679, "ground_truth": 0}, {"key": "35010363", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5544704530697735, "ground_truth": 0}, {"key": "35010363", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909763080602643, "ground_truth": 0}, {"key": "35010363", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174975430487, "ground_truth": 0}, {"key": "27514800", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835469746836, "ground_truth": 0}, {"key": "27514800", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511512736736, "ground_truth": 0}, {"key": "27514800", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8587186031570326, "ground_truth": 0}, {"key": "27514800", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624725719344, "ground_truth": 0}, {"key": "27514800", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892337006450736, "ground_truth": 0}, {"key": "25725840", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.4225046156184929, "ground_truth": 0}, {"key": "25725840", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5448013698083071, "ground_truth": 0}, {"key": "25725840", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6531269423840641, "ground_truth": 0}, {"key": "25725840", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916056517245, "ground_truth": 0}, {"key": "25725840", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794003900408439, "ground_truth": 0}, {"key": "38327225", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8031737993620792, "ground_truth": 0}, {"key": "38327225", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7490872055489409, "ground_truth": 0}, {"key": "38327225", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8407825941098117, "ground_truth": 0}, {"key": "38327225", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117963220845, "ground_truth": 0}, {"key": "38327225", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528023043059, "ground_truth": 0}, {"key": "11991724", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8068526058207754, "ground_truth": 0}, {"key": "11991724", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7325918234091818, "ground_truth": 0}, {"key": "11991724", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8558511469153814, "ground_truth": 0}, {"key": "11991724", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891074797835, "ground_truth": 0}, {"key": "11991724", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797604040845, "ground_truth": 0}, {"key": "32217545", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6808786071345557, "ground_truth": 0}, {"key": "32217545", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7025300748932455, "ground_truth": 0}, {"key": "32217545", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8056321938239149, "ground_truth": 0}, {"key": "32217545", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.79944231737342, "ground_truth": 0}, {"key": "32217545", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544172885546, "ground_truth": 0}, {"key": "12731847", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5945512598697485, "ground_truth": 0}, {"key": "12731847", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6297745924096623, "ground_truth": 0}, {"key": "12731847", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7138307515536795, "ground_truth": 0}, {"key": "12731847", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432093435903, "ground_truth": 0}, {"key": "12731847", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460136898148873, "ground_truth": 0}, {"key": "36827234", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.756357577385295, "ground_truth": 0}, {"key": "36827234", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7772998481208296, "ground_truth": 0}, {"key": "36827234", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8529354821186561, "ground_truth": 0}, {"key": "36827234", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624526452303, "ground_truth": 0}, {"key": "36827234", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916156473673, "ground_truth": 0}, {"key": "29111539", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8407825800922223, "ground_truth": 0}, {"key": "29111539", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9073122142776977, "ground_truth": 0}, {"key": "29111539", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9032942085464193, "ground_truth": 0}, {"key": "29111539", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846317845321, "ground_truth": 0}, {"key": "29111539", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647047061599, "ground_truth": 0}, {"key": "37763052", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6370308061097661, "ground_truth": 0}, {"key": "37763052", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7476159269456487, "ground_truth": 0}, {"key": "37763052", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7732163592127606, "ground_truth": 0}, {"key": "37763052", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.769080230840659, "ground_truth": 0}, {"key": "37763052", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303145895677, "ground_truth": 0}, {"key": "30682335", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5736784027402964, "ground_truth": 0}, {"key": "30682335", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7154240006932926, "ground_truth": 0}, {"key": "30682335", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.594551223227834, "ground_truth": 0}, {"key": "30682335", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984962242809, "ground_truth": 0}, {"key": "30682335", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331343069394, "ground_truth": 0}, {"key": "12261276", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.32939172094042335, "ground_truth": 0}, {"key": "12261276", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.44167300456741826, "ground_truth": 0}, {"key": "12261276", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.38861802416244945, "ground_truth": 0}, {"key": "12261276", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.394200933048598, "ground_truth": 0}, {"key": "12261276", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734940367723, "ground_truth": 0}, {"key": "36912979", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5292633899571972, "ground_truth": 0}, {"key": "36912979", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6757646027835077, "ground_truth": 0}, {"key": "36912979", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7074046903021858, "ground_truth": 0}, {"key": "36912979", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.49218815637894525, "ground_truth": 0}, {"key": "36912979", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736784182299974, "ground_truth": 0}, {"key": "30205259", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8940517203772732, "ground_truth": 0}, {"key": "30205259", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8723473863967293, "ground_truth": 0}, {"key": "30205259", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8740772400363037, "ground_truth": 0}, {"key": "30205259", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923161067158, "ground_truth": 0}, {"key": "30205259", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.893309406587244, "ground_truth": 0}, {"key": "39458032", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9702399097989759, "ground_truth": 0}, {"key": "39458032", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9632305321406598, "ground_truth": 0}, {"key": "39458032", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9618217267866268, "ground_truth": 0}, {"key": "39458032", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9539660959649738, "ground_truth": 0}, {"key": "39458032", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9621075720086789, "ground_truth": 0}, {"key": "35116452", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.766293632015858, "ground_truth": 0}, {"key": "35116452", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7057850257975073, "ground_truth": 0}, {"key": "35116452", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253646488678, "ground_truth": 0}, {"key": "35116452", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191343461298, "ground_truth": 0}, {"key": "35116452", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163778641173, "ground_truth": 0}, {"key": "40107476", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8233284015585534, "ground_truth": 0}, {"key": "40107476", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.89029421739843, "ground_truth": 0}, {"key": "40107476", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8267117896247678, "ground_truth": 0}, {"key": "40107476", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.884837766795257, "ground_truth": 0}, {"key": "40107476", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339773137599, "ground_truth": 0}, {"key": "39501049", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9304582645519516, "ground_truth": 0}, {"key": "39501049", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.927363295031472, "ground_truth": 0}, {"key": "39501049", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9518632306129777, "ground_truth": 0}, {"key": "39501049", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9334308179680181, "ground_truth": 0}, {"key": "39501049", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9453993887761658, "ground_truth": 0}, {"key": "39642178", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6442250814452698, "ground_truth": 0}, {"key": "39642178", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4960938456096452, "ground_truth": 0}, {"key": "39642178", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.564098499215316, "ground_truth": 0}, {"key": "39642178", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754673196134, "ground_truth": 0}, {"key": "39642178", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704691537714, "ground_truth": 0}, {"key": "38024796", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6206216032558547, "ground_truth": 0}, {"key": "38024796", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6825737334220277, "ground_truth": 0}, {"key": "38024796", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.734119528381046, "ground_truth": 0}, {"key": "38024796", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920227384974, "ground_truth": 0}, {"key": "38024796", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850182737883, "ground_truth": 0}, {"key": "36652079", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6057990378508604, "ground_truth": 0}, {"key": "36652079", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7025300543206853, "ground_truth": 0}, {"key": "36652079", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5621764612182408, "ground_truth": 0}, {"key": "36652079", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711766115258, "ground_truth": 0}, {"key": "36652079", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852883209829117, "ground_truth": 0}, {"key": "32193402", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8233284158483318, "ground_truth": 0}, {"key": "32193402", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7577943765213484, "ground_truth": 0}, {"key": "32193402", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8164063643507006, "ground_truth": 0}, {"key": "32193402", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748504383053, "ground_truth": 0}, {"key": "32193402", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233284182375349, "ground_truth": 0}, {"key": "32589706", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8489722050768508, "ground_truth": 0}, {"key": "32589706", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8509646976940282, "ground_truth": 0}, {"key": "32589706", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9053222935733701, "ground_truth": 0}, {"key": "32589706", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677494685061, "ground_truth": 0}, {"key": "32589706", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240876380421, "ground_truth": 0}, {"key": "38590589", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7534666373712524, "ground_truth": 0}, {"key": "38590589", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7520125557486251, "ground_truth": 0}, {"key": "38590589", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7772998720731092, "ground_truth": 0}, {"key": "38590589", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672137886068, "ground_truth": 0}, {"key": "38590589", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036145640971, "ground_truth": 0}, {"key": "37045414", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9835969680285549, "ground_truth": 0}, {"key": "37045414", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9861513901937928, "ground_truth": 0}, {"key": "37045414", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9726235084949917, "ground_truth": 0}, {"key": "37045414", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9808759638153722, "ground_truth": 0}, {"key": "37045414", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9838471637425555, "ground_truth": 0}, {"key": "33310095", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9190632936780485, "ground_truth": 0}, {"key": "33310095", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8984105486386015, "ground_truth": 0}, {"key": "33310095", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631373769282, "ground_truth": 0}, {"key": "33310095", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513727774344, "ground_truth": 0}, {"key": "33310095", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122138119725, "ground_truth": 0}, {"key": "37934604", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7476159451684775, "ground_truth": 0}, {"key": "37934604", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.737158193391377, "ground_truth": 0}, {"key": "37934604", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8031737924049538, "ground_truth": 0}, {"key": "37934604", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306178410196, "ground_truth": 0}, {"key": "37934604", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511530581348, "ground_truth": 0}, {"key": "39012181", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.992304353651554, "ground_truth": 0}, {"key": "39012181", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9902161245539346, "ground_truth": 0}, {"key": "39012181", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9885803854799617, "ground_truth": 0}, {"key": "39012181", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9925969857470336, "ground_truth": 0}, {"key": "39012181", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9918752913198926, "ground_truth": 0}, {"key": "40221674", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9420819141597948, "ground_truth": 0}, {"key": "40221674", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8816149068001503, "ground_truth": 0}, {"key": "40221674", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9284088035499137, "ground_truth": 0}, {"key": "40221674", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343738280872, "ground_truth": 0}, {"key": "40221674", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9458012695313852, "ground_truth": 0}, {"key": "36884862", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.883235985430412, "ground_truth": 0}, {"key": "36884862", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8918110471289358, "ground_truth": 0}, {"key": "36884862", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9105453953221575, "ground_truth": 0}, {"key": "36884862", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070075361979, "ground_truth": 0}, {"key": "36884862", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.879974375252081, "ground_truth": 0}, {"key": "39054429", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7759445517539575, "ground_truth": 0}, {"key": "39054429", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8688267832639983, "ground_truth": 0}, {"key": "39054429", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7718434931044164, "ground_truth": 0}, {"key": "39054429", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956580997013567, "ground_truth": 0}, {"key": "39054429", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956580916399133, "ground_truth": 0}, {"key": "36753964", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8152324988869434, "ground_truth": 0}, {"key": "36753964", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8006919863402807, "ground_truth": 0}, {"key": "36753964", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7170118698549869, "ground_truth": 0}, {"key": "36753964", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307878022364, "ground_truth": 0}, {"key": "36753964", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.823328408805308, "ground_truth": 0}, {"key": "37612459", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8489721972030461, "ground_truth": 0}, {"key": "37612459", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9149009609887617, "ground_truth": 0}, {"key": "37612459", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8661325136998934, "ground_truth": 0}, {"key": "37612459", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797533772168, "ground_truth": 0}, {"key": "37612459", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8783142537502266, "ground_truth": 0}, {"key": "36805789", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8864204137558727, "ground_truth": 0}, {"key": "36805789", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9546474231135715, "ground_truth": 0}, {"key": "36805789", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9445872047255458, "ground_truth": 0}, {"key": "36805789", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823379522731, "ground_truth": 0}, {"key": "36805789", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9252299521439448, "ground_truth": 0}, {"key": "12757394", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7634837522711481, "ground_truth": 0}, {"key": "12757394", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8499711678775397, "ground_truth": 0}, {"key": "12757394", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8104789037007947, "ground_truth": 0}, {"key": "12757394", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835323243054, "ground_truth": 0}, {"key": "12757394", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.702530044458968, "ground_truth": 0}, {"key": "32192542", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9543079673764339, "ground_truth": 0}, {"key": "32192542", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9559813473108135, "ground_truth": 0}, {"key": "32192542", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9645892693496542, "ground_truth": 0}, {"key": "32192542", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9582261170006409, "ground_truth": 0}, {"key": "32192542", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9569571500125276, "ground_truth": 0}, {"key": "34856060", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.501953093848794, "ground_truth": 0}, {"key": "34856060", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.443600441158731, "ground_truth": 0}, {"key": "34856060", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7264256053241588, "ground_truth": 0}, {"key": "34856060", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324864857078, "ground_truth": 0}, {"key": "34856060", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737244344249, "ground_truth": 0}, {"key": "36083416", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8976952903542261, "ground_truth": 0}, {"key": "36083416", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8740772325997025, "ground_truth": 0}, {"key": "36083416", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8998277808144018, "ground_truth": 0}, {"key": "36083416", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587948448353, "ground_truth": 0}, {"key": "36083416", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297903304202, "ground_truth": 0}, {"key": "33839050", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6297746167870288, "ground_truth": 0}, {"key": "33839050", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5660185253473005, "ground_truth": 0}, {"key": "33839050", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6297746064828428, "ground_truth": 0}, {"key": "33839050", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073828641894, "ground_truth": 0}, {"key": "33839050", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909763111509329, "ground_truth": 0}, {"key": "18464690", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7416740181923853, "ground_truth": 0}, {"key": "18464690", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7431679982851529, "ground_truth": 0}, {"key": "18464690", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7416740028371607, "ground_truth": 0}, {"key": "18464690", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953519820138, "ground_truth": 0}, {"key": "18464690", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185650672803, "ground_truth": 0}, {"key": "39212665", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6876299980105148, "ground_truth": 0}, {"key": "39212665", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5273165268529547, "ground_truth": 0}, {"key": "39212665", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5195213217556336, "ground_truth": 0}, {"key": "39212665", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047005983027, "ground_truth": 0}, {"key": "39212665", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269140487836, "ground_truth": 0}, {"key": "40094011", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7969253606407897, "ground_truth": 0}, {"key": "40094011", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.799442310172913, "ground_truth": 0}, {"key": "40094011", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8300437765112909, "ground_truth": 0}, {"key": "40094011", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321923471194, "ground_truth": 0}, {"key": "40094011", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640314026576, "ground_truth": 0}, {"key": "36036272", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8044059242521935, "ground_truth": 0}, {"key": "36036272", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8397339844883325, "ground_truth": 0}, {"key": "36036272", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8187367693184432, "ground_truth": 0}, {"key": "36036272", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233284026461889, "ground_truth": 0}, {"key": "36036272", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754530906449, "ground_truth": 0}, {"key": "30681904", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.665410554780824, "ground_truth": 0}, {"key": "30681904", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6909762916631765, "ground_truth": 0}, {"key": "30681904", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7981867786076428, "ground_truth": 0}, {"key": "30681904", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.740174372698597, "ground_truth": 0}, {"key": "30681904", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197699729227, "ground_truth": 0}, {"key": "27834240", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7690802452556811, "ground_truth": 0}, {"key": "27834240", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7892336886274817, "ground_truth": 0}, {"key": "27834240", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7745833853933619, "ground_truth": 0}, {"key": "27834240", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493014811888, "ground_truth": 0}, {"key": "27834240", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206215941324535, "ground_truth": 0}, {"key": "35025075", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7853085905588182, "ground_truth": 0}, {"key": "35025075", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8984105469045529, "ground_truth": 0}, {"key": "35025075", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8386797608244367, "ground_truth": 0}, {"key": "35025075", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239767200147, "ground_truth": 0}, {"key": "35025075", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.759225422388844, "ground_truth": 0}, {"key": "33316985", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8615382126457161, "ground_truth": 0}, {"key": "33316985", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8365545653660698, "ground_truth": 0}, {"key": "33316985", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8140527895682396, "ground_truth": 0}, {"key": "33316985", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849605575999, "ground_truth": 0}, {"key": "33316985", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.737158159609219, "ground_truth": 0}, {"key": "17037056", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.571766601414437, "ground_truth": 0}, {"key": "17037056", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5679366000882102, "ground_truth": 0}, {"key": "17037056", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.4921881260854291, "ground_truth": 0}, {"key": "17037056", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023561556813516, "ground_truth": 0}, {"key": "17037056", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175709062473582, "ground_truth": 0}, {"key": "34050457", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8080672065138709, "ground_truth": 0}, {"key": "34050457", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8568122838272457, "ground_truth": 0}, {"key": "34050457", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8824278639481189, "ground_truth": 0}, {"key": "34050457", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366587687774, "ground_truth": 0}, {"key": "34050457", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879312011869521, "ground_truth": 0}, {"key": "34713745", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7520125794624507, "ground_truth": 0}, {"key": "34713745", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6113819866444999, "ground_truth": 0}, {"key": "34713745", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7106283187114517, "ground_truth": 0}, {"key": "34713745", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581636086957, "ground_truth": 0}, {"key": "34713745", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647917052602, "ground_truth": 0}, {"key": "40856210", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5019531159929865, "ground_truth": 0}, {"key": "40856210", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5660185460791961, "ground_truth": 0}, {"key": "40856210", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5448013807710345, "ground_truth": 0}, {"key": "40856210", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585904812194, "ground_truth": 0}, {"key": "40856210", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256138408123, "ground_truth": 0}, {"key": "40848302", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6723316779304882, "ground_truth": 0}, {"key": "40848302", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7476159692884486, "ground_truth": 0}, {"key": "40848302", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6531269088627616, "ground_truth": 0}, {"key": "40848302", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762928564542, "ground_truth": 0}, {"key": "40848302", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601319488147, "ground_truth": 0}, {"key": "40636168", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7718435050577934, "ground_truth": 0}, {"key": "40636168", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8489721883345046, "ground_truth": 0}, {"key": "40636168", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8624675289996949, "ground_truth": 0}, {"key": "40636168", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423123109761, "ground_truth": 0}, {"key": "40636168", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837570673625, "ground_truth": 0}, {"key": "34423311", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8006919974082373, "ground_truth": 0}, {"key": "34423311", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7233094903178088, "ground_truth": 0}, {"key": "34423311", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.667147687945376, "ground_truth": 0}, {"key": "34423311", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.631594324901312, "ground_truth": 0}, {"key": "34423311", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791787352994704, "ground_truth": 0}, {"key": "34833945", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9753900675476559, "ground_truth": 0}, {"key": "34833945", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9802808721725617, "ground_truth": 0}, {"key": "34833945", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9643214469130511, "ground_truth": 0}, {"key": "34833945", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9777138158151246, "ground_truth": 0}, {"key": "34833945", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9676556655096454, "ground_truth": 0}, {"key": "21272328", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6187804247616631, "ground_truth": 0}, {"key": "21272328", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8697145839173461, "ground_truth": 0}, {"key": "21272328", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7577943857255918, "ground_truth": 0}, {"key": "21272328", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948139800452, "ground_truth": 0}, {"key": "21272328", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544124520224, "ground_truth": 0}, {"key": "38648957", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7154239966562428, "ground_truth": 0}, {"key": "38648957", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6442251150130129, "ground_truth": 0}, {"key": "38648957", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7310585721678076, "ground_truth": 0}, {"key": "38648957", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948434057978, "ground_truth": 0}, {"key": "38648957", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593446064579, "ground_truth": 0}, {"key": "24942981", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5525397389861643, "ground_truth": 0}, {"key": "24942981", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.439747331377833, "ground_truth": 0}, {"key": "24942981", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5234203241814517, "ground_truth": 0}, {"key": "24942981", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666370711797, "ground_truth": 0}, {"key": "24942981", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878322618234, "ground_truth": 0}, {"key": "35882366", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6477982153542177, "ground_truth": 0}, {"key": "35882366", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8918110480894806, "ground_truth": 0}, {"key": "35882366", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7279754514507518, "ground_truth": 0}, {"key": "35882366", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.814052791350496, "ground_truth": 0}, {"key": "35882366", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159484858641, "ground_truth": 0}, {"key": "40559523", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7943849636718434, "ground_truth": 0}, {"key": "40559523", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7549149893087327, "ground_truth": 0}, {"key": "40559523", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8221891341495524, "ground_truth": 0}, {"key": "40559523", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239976631261, "ground_truth": 0}, {"key": "40559523", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737841693627, "ground_truth": 0}, {"key": "24632722", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7981867647855019, "ground_truth": 0}, {"key": "24632722", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6315943060913617, "ground_truth": 0}, {"key": "24632722", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5813031341130259, "ground_truth": 0}, {"key": "24632722", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.741674014636145, "ground_truth": 0}, {"key": "24632722", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563440984284, "ground_truth": 0}, {"key": "36002759", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6842640578925929, "ground_truth": 0}, {"key": "36002759", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5851011587912914, "ground_truth": 0}, {"key": "36002759", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.805632175516669, "ground_truth": 0}, {"key": "36002759", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984925517467, "ground_truth": 0}, {"key": "36002759", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203705451262, "ground_truth": 0}, {"key": "29508534", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835430864997, "ground_truth": 0}, {"key": "29508534", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7745833891361316, "ground_truth": 0}, {"key": "29508534", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.766293647336233, "ground_truth": 0}, {"key": "29508534", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445409969784, "ground_truth": 0}, {"key": "29508534", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490871839614985, "ground_truth": 0}, {"key": "15631612", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7634837657649346, "ground_truth": 0}, {"key": "15631612", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7704647889185595, "ground_truth": 0}, {"key": "15631612", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8267118022351596, "ground_truth": 0}, {"key": "15631612", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884632977463, "ground_truth": 0}, {"key": "15631612", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897464443358, "ground_truth": 0}, {"key": "40731892", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6020615932122938, "ground_truth": 0}, {"key": "40731892", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5273165293018147, "ground_truth": 0}, {"key": "40731892", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5428632903767637, "ground_truth": 0}, {"key": "40731892", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241556161607, "ground_truth": 0}, {"key": "40731892", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167499056758, "ground_truth": 0}, {"key": "35971910", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8267118016854276, "ground_truth": 0}, {"key": "35971910", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8479677625375062, "ground_truth": 0}, {"key": "35971910", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.826711803889263, "ground_truth": 0}, {"key": "35971910", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278778078279, "ground_truth": 0}, {"key": "35971910", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673068733063, "ground_truth": 0}, {"key": "34428424", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.972204376457439, "ground_truth": 0}, {"key": "34428424", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9722043785057984, "ground_truth": 0}, {"key": "34428424", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9690910392208616, "ground_truth": 0}, {"key": "34428424", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9730365027292084, "ground_truth": 0}, {"key": "34428424", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9575961734811289, "ground_truth": 0}, {"key": "36971005", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9178933663749003, "ground_truth": 0}, {"key": "36971005", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9273632848852441, "ground_truth": 0}, {"key": "36971005", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9536217946058776, "ground_truth": 0}, {"key": "36971005", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797081926494, "ground_truth": 0}, {"key": "36971005", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037289278107, "ground_truth": 0}, {"key": "34649067", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7371581518579563, "ground_truth": 0}, {"key": "34649067", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6297746390899999, "ground_truth": 0}, {"key": "34649067", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6297745902946763, "ground_truth": 0}, {"key": "34649067", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224516939048, "ground_truth": 0}, {"key": "34649067", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082846714169, "ground_truth": 0}, {"key": "37355154", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6460137092541143, "ground_truth": 0}, {"key": "37355154", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7839884816309324, "ground_truth": 0}, {"key": "37355154", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6001883671787792, "ground_truth": 0}, {"key": "37355154", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185147379894, "ground_truth": 0}, {"key": "37355154", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624836395907, "ground_truth": 0}, {"key": "38674697", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7074047037023209, "ground_truth": 0}, {"key": "38674697", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6150878499962806, "ground_truth": 0}, {"key": "38674697", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6825737407184161, "ground_truth": 0}, {"key": "38674697", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701231131563, "ground_truth": 0}, {"key": "38674697", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476618176708, "ground_truth": 0}, {"key": "40525767", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9916195469036628, "ground_truth": 0}, {"key": "40525767", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9920620056574417, "ground_truth": 0}, {"key": "40525767", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9905142861797972, "ground_truth": 0}, {"key": "40525767", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.983342960718556, "ground_truth": 0}, {"key": "40525767", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9773708000457069, "ground_truth": 0}, {"key": "27165110", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.513668482005892, "ground_truth": 0}, {"key": "27165110", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7310585631840213, "ground_truth": 0}, {"key": "27165110", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6926419994388757, "ground_truth": 0}, {"key": "27165110", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953777771197, "ground_truth": 0}, {"key": "27165110", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824290999756326, "ground_truth": 0}, {"key": "35497491", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7520125739787249, "ground_truth": 0}, {"key": "35497491", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6039318288168919, "ground_truth": 0}, {"key": "35497491", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7074047037692983, "ground_truth": 0}, {"key": "35497491", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324943732644, "ground_truth": 0}, {"key": "35497491", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191296268846, "ground_truth": 0}, {"key": "40690716", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.913058343772138, "ground_truth": 0}, {"key": "40690716", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9190632872218811, "ground_truth": 0}, {"key": "40690716", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.931959577651438, "ground_truth": 0}, {"key": "40690716", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9184802509626055, "ground_truth": 0}, {"key": "40690716", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9289263286686988, "ground_truth": 0}, {"key": "34835193", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9820137902360544, "ground_truth": 0}, {"key": "34835193", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9848109525469423, "ground_truth": 0}, {"key": "34835193", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9832145107353253, "ground_truth": 0}, {"key": "34835193", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9804313252320976, "ground_truth": 0}, {"key": "34835193", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9618217263490553, "ground_truth": 0}, {"key": "39471712", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6909763004982603, "ground_truth": 0}, {"key": "39471712", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7461389841663922, "ground_truth": 0}, {"key": "39471712", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7956581083751352, "ground_truth": 0}, {"key": "39471712", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563381960678, "ground_truth": 0}, {"key": "39471712", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740026555724, "ground_truth": 0}, {"key": "39115192", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8902942202536195, "ground_truth": 0}, {"key": "39115192", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8221891204098803, "ground_truth": 0}, {"key": "39115192", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8311430514662608, "ground_truth": 0}, {"key": "39115192", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673148181508, "ground_truth": 0}, {"key": "39115192", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764794083793, "ground_truth": 0}, {"key": "23520673", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5058591112130963, "ground_truth": 0}, {"key": "23520673", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4649015506196189, "ground_truth": 0}, {"key": "23520673", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.726425596612307, "ground_truth": 0}, {"key": "23520673", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224256458046, "ground_truth": 0}, {"key": "23520673", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633154470018836, "ground_truth": 0}, {"key": "35764233", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7648916299239199, "ground_truth": 0}, {"key": "35764233", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6513548636960693, "ground_truth": 0}, {"key": "35764233", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7981867612280809, "ground_truth": 0}, {"key": "35764233", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239885100131, "ground_truth": 0}, {"key": "35764233", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592254011651111, "ground_truth": 0}, {"key": "35228910", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7371581767630528, "ground_truth": 0}, {"key": "35228910", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6442251247458969, "ground_truth": 0}, {"key": "35228910", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6261241753211801, "ground_truth": 0}, {"key": "35228910", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615704183909, "ground_truth": 0}, {"key": "35228910", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321653998631, "ground_truth": 0}, {"key": "36795599", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9416541506129383, "ground_truth": 0}, {"key": "36795599", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9362850054885702, "ground_truth": 0}, {"key": "36795599", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.959154282568443, "ground_truth": 0}, {"key": "36795599", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9319595787885246, "ground_truth": 0}, {"key": "36795599", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9553191307232155, "ground_truth": 0}, {"key": "38641949", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8661325151286828, "ground_truth": 0}, {"key": "38641949", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8031738101611858, "ground_truth": 0}, {"key": "38641949", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7759445592571584, "ground_truth": 0}, {"key": "38641949", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675373749476, "ground_truth": 0}, {"key": "38641949", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672254061425, "ground_truth": 0}, {"key": "29968443", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9496693657478908, "ground_truth": 0}, {"key": "29968443", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9339146169847863, "ground_truth": 0}, {"key": "29968443", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9489172644962857, "ground_truth": 0}, {"key": "29968443", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9412234454447784, "ground_truth": 0}, {"key": "29968443", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9412234413875972, "ground_truth": 0}, {"key": "21268042", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7563575617273524, "ground_truth": 0}, {"key": "21268042", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8056321918978269, "ground_truth": 0}, {"key": "21268042", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6859494416030569, "ground_truth": 0}, {"key": "21268042", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367915640408, "ground_truth": 0}, {"key": "21268042", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476621620535, "ground_truth": 0}, {"key": "26808572", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7325918379205104, "ground_truth": 0}, {"key": "26808572", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.49609380897913935, "ground_truth": 0}, {"key": "26808572", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8244619132228824, "ground_truth": 0}, {"key": "26808572", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677619693595, "ground_truth": 0}, {"key": "26808572", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743830364408, "ground_truth": 0}, {"key": "37829390", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.749087227161841, "ground_truth": 0}, {"key": "37829390", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.840782583799584, "ground_truth": 0}, {"key": "37829390", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8289388127981365, "ground_truth": 0}, {"key": "37829390", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.723309466658626, "ground_truth": 0}, {"key": "37829390", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585599332724, "ground_truth": 0}, {"key": "35716045", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8365545597084205, "ground_truth": 0}, {"key": "35716045", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7592254179850483, "ground_truth": 0}, {"key": "35716045", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8397339647521537, "ground_truth": 0}, {"key": "35716045", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919863828588, "ground_truth": 0}, {"key": "35716045", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637498423105, "ground_truth": 0}, {"key": "34367070", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9079671482827221, "ground_truth": 0}, {"key": "34367070", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8887587915292554, "ground_truth": 0}, {"key": "34367070", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9173026597995508, "ground_truth": 0}, {"key": "34367070", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846416380615, "ground_truth": 0}, {"key": "34367070", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840463045962, "ground_truth": 0}, {"key": "35239748", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9118099557231201, "ground_truth": 0}, {"key": "35239748", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511621232782, "ground_truth": 0}, {"key": "35239748", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.839733979547162, "ground_truth": 0}, {"key": "35239748", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473705322607, "ground_truth": 0}, {"key": "35239748", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9173026537199617, "ground_truth": 0}, {"key": "40421370", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7490872010408385, "ground_truth": 0}, {"key": "40421370", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624776779878, "ground_truth": 0}, {"key": "40421370", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8354835358454723, "ground_truth": 0}, {"key": "40421370", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489722075475029, "ground_truth": 0}, {"key": "40421370", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.810478922744717, "ground_truth": 0}, {"key": "37288396", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8344068829451704, "ground_truth": 0}, {"key": "37288396", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6926419833730448, "ground_truth": 0}, {"key": "37288396", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8499711715614313, "ground_truth": 0}, {"key": "37288396", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367837686175, "ground_truth": 0}, {"key": "37288396", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998663585929, "ground_truth": 0}, {"key": "38903688", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8976952883622452, "ground_truth": 0}, {"key": "38903688", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9167080758119048, "ground_truth": 0}, {"key": "38903688", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8606036123243536, "ground_truth": 0}, {"key": "38903688", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148251529566, "ground_truth": 0}, {"key": "38903688", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528019015122, "ground_truth": 0}, {"key": "28071228", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.926303728248369, "ground_truth": 0}, {"key": "28071228", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9161096087235305, "ground_truth": 0}, {"key": "28071228", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9324533074975951, "ground_truth": 0}, {"key": "28071228", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9416541572006286, "ground_truth": 0}, {"key": "28071228", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8723473618073244, "ground_truth": 0}, {"key": "36855834", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7826624812376093, "ground_truth": 0}, {"key": "36855834", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7892336887139074, "ground_truth": 0}, {"key": "36855834", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6808786198387381, "ground_truth": 0}, {"key": "36855834", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.753466635620184, "ground_truth": 0}, {"key": "36855834", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506361573574, "ground_truth": 0}, {"key": "40548717", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6671476646969492, "ground_truth": 0}, {"key": "40548717", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6297746094389974, "ground_truth": 0}, {"key": "40548717", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7185944152919367, "ground_truth": 0}, {"key": "40548717", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998610474252, "ground_truth": 0}, {"key": "40548717", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.732591823119863, "ground_truth": 0}, {"key": "37051175", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7648916102844903, "ground_truth": 0}, {"key": "37051175", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6859494850915143, "ground_truth": 0}, {"key": "37051175", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5117165938530545, "ground_truth": 0}, {"key": "37051175", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948395132234, "ground_truth": 0}, {"key": "37051175", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118727675092, "ground_truth": 0}, {"key": "38882119", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8397339588490575, "ground_truth": 0}, {"key": "38882119", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7057850364177221, "ground_truth": 0}, {"key": "38882119", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.764891602166354, "ground_truth": 0}, {"key": "38882119", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.810478897948943, "ground_truth": 0}, {"key": "38882119", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306140523051, "ground_truth": 0}, {"key": "19485402", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7476159582247189, "ground_truth": 0}, {"key": "19485402", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8140528166140576, "ground_truth": 0}, {"key": "19485402", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8092759693000773, "ground_truth": 0}, {"key": "19485402", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527572469658, "ground_truth": 0}, {"key": "19485402", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837628574095, "ground_truth": 0}, {"key": "36060907", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8244619193170607, "ground_truth": 0}, {"key": "36060907", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9142907263083386, "ground_truth": 0}, {"key": "36060907", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9026095982450759, "ground_truth": 0}, {"key": "36060907", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067228206728, "ground_truth": 0}, {"key": "36060907", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9339146240478049, "ground_truth": 0}, {"key": "24037309", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9343951652899753, "ground_truth": 0}, {"key": "24037309", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9465966670037153, "ground_truth": 0}, {"key": "24037309", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9722043747503955, "ground_truth": 0}, {"key": "24037309", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9525741242240504, "ground_truth": 0}, {"key": "24037309", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9674102572167957, "ground_truth": 0}, {"key": "35605805", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8140528192120556, "ground_truth": 0}, {"key": "35605805", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9207896697759247, "ground_truth": 0}, {"key": "35605805", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8740772299460694, "ground_truth": 0}, {"key": "35605805", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324877738022, "ground_truth": 0}, {"key": "35605805", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104505378081, "ground_truth": 0}, {"key": "17706248", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7745834020186527, "ground_truth": 0}, {"key": "17706248", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6774740238635444, "ground_truth": 0}, {"key": "17706248", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6460137049011473, "ground_truth": 0}, {"key": "17706248", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.779992912984874, "ground_truth": 0}, {"key": "17706248", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943861332923, "ground_truth": 0}, {"key": "36883559", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8267118096684852, "ground_truth": 0}, {"key": "36883559", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7892336839729299, "ground_truth": 0}, {"key": "36883559", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8267117843313858, "ground_truth": 0}, {"key": "36883559", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339612807599, "ground_truth": 0}, {"key": "36883559", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215432692914, "ground_truth": 0}, {"key": "32799471", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7813306005262086, "ground_truth": 0}, {"key": "32799471", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8670357643260609, "ground_truth": 0}, {"key": "32799471", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8233284101669829, "ground_truth": 0}, {"key": "32799471", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916078180629, "ground_truth": 0}, {"key": "32799471", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905302922408105, "ground_truth": 0}, {"key": "34797243", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6132365344430445, "ground_truth": 0}, {"key": "34797243", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.640635835466039, "ground_truth": 0}, {"key": "34797243", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7025300587230406, "ground_truth": 0}, {"key": "34797243", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203534013622, "ground_truth": 0}, {"key": "34797243", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704478394624, "ground_truth": 0}, {"key": "32154876", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8128673147150898, "ground_truth": 0}, {"key": "32154876", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8187367880221328, "ground_truth": 0}, {"key": "32154876", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8068526227833412, "ground_truth": 0}, {"key": "32154876", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297745953397503, "ground_truth": 0}, {"key": "32154876", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835465536075, "ground_truth": 0}, {"key": "37962274", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6876300138631116, "ground_truth": 0}, {"key": "37962274", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6477982227855059, "ground_truth": 0}, {"key": "37962274", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8140528126622956, "ground_truth": 0}, {"key": "37962274", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982176479647, "ground_truth": 0}, {"key": "37962274", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666675541306, "ground_truth": 0}, {"key": "35574030", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9012274106588327, "ground_truth": 0}, {"key": "35574030", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8723473842560739, "ground_truth": 0}, {"key": "35574030", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9026096033347512, "ground_truth": 0}, {"key": "35574030", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366535329482, "ground_truth": 0}, {"key": "35574030", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359978752802, "ground_truth": 0}, {"key": "39105949", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9184802488351619, "ground_truth": 0}, {"key": "39105949", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9235923160629324, "ground_truth": 0}, {"key": "39105949", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9241418191028301, "ground_truth": 0}, {"key": "39105949", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9343951627877886, "ground_truth": 0}, {"key": "39105949", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8895288508073315, "ground_truth": 0}, {"key": "41064322", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9224823457785306, "ground_truth": 0}, {"key": "41064322", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9556514194573597, "ground_truth": 0}, {"key": "41064322", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9394706059552839, "ground_truth": 0}, {"key": "41064322", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9489172625281667, "ground_truth": 0}, {"key": "41064322", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.957596170525629, "ground_truth": 0}, {"key": "28105101", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7401743564280142, "ground_truth": 0}, {"key": "28105101", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6654105328662278, "ground_truth": 0}, {"key": "28105101", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6352224213015764, "ground_truth": 0}, {"key": "28105101", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105458964564, "ground_truth": 0}, {"key": "28105101", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004357281232, "ground_truth": 0}, {"key": "36036068", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6279512228704377, "ground_truth": 0}, {"key": "36036068", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7074047120481209, "ground_truth": 0}, {"key": "36036068", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253670731565, "ground_truth": 0}, {"key": "36036068", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.702530055495488, "ground_truth": 0}, {"key": "36036068", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592254117656629, "ground_truth": 0}, {"key": "37991460", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7520125766516264, "ground_truth": 0}, {"key": "37991460", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8140528029646131, "ground_truth": 0}, {"key": "37991460", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7233094788036629, "ground_truth": 0}, {"key": "37991460", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382180099797, "ground_truth": 0}, {"key": "37991460", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036238591754, "ground_truth": 0}, {"key": "38437830", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7185943978349845, "ground_truth": 0}, {"key": "38437830", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8210441028758596, "ground_truth": 0}, {"key": "38437830", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8267117871943691, "ground_truth": 0}, {"key": "38437830", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059232189906, "ground_truth": 0}, {"key": "38437830", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748711500504, "ground_truth": 0}, {"key": "36507138", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.856812289704314, "ground_truth": 0}, {"key": "36507138", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5888891339183205, "ground_truth": 0}, {"key": "36507138", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7248703063764204, "ground_truth": 0}, {"key": "36507138", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.789233679886636, "ground_truth": 0}, {"key": "36507138", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434970649996, "ground_truth": 0}, {"key": "37824866", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8509646961169938, "ground_truth": 0}, {"key": "37824866", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8187368054734419, "ground_truth": 0}, {"key": "37824866", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6808786140213705, "ground_truth": 0}, {"key": "37824866", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118787508802, "ground_truth": 0}, {"key": "37824866", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585890429148, "ground_truth": 0}, {"key": "25088134", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5774953473180532, "ground_truth": 0}, {"key": "25088134", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.627951231704641, "ground_truth": 0}, {"key": "25088134", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7549149862994804, "ground_truth": 0}, {"key": "25088134", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802474990422, "ground_truth": 0}, {"key": "25088134", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740289967516, "ground_truth": 0}, {"key": "40172531", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6943026822301374, "ground_truth": 0}, {"key": "40172531", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7918210655076753, "ground_truth": 0}, {"key": "40172531", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.848972207371942, "ground_truth": 0}, {"key": "40172531", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.842863135309578, "ground_truth": 0}, {"key": "40172531", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437851202774, "ground_truth": 0}, {"key": "37035874", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6859494609096478, "ground_truth": 0}, {"key": "37035874", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8333245823197194, "ground_truth": 0}, {"key": "37035874", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8479677493666977, "ground_truth": 0}, {"key": "37035874", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281520510138, "ground_truth": 0}, {"key": "37035874", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998643622837, "ground_truth": 0}, {"key": "36404465", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9717790133966357, "ground_truth": 0}, {"key": "36404465", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9609517100327034, "ground_truth": 0}, {"key": "36404465", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9603611585816454, "ground_truth": 0}, {"key": "36404465", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9777138175673422, "ground_truth": 0}, {"key": "36404465", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9724147166675183, "ground_truth": 0}, {"key": "39602052", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8548846321863619, "ground_truth": 0}, {"key": "39602052", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8300437562613935, "ground_truth": 0}, {"key": "39602052", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8354835323441602, "ground_truth": 0}, {"key": "39602052", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759942841768, "ground_truth": 0}, {"key": "39602052", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382017710883, "ground_truth": 0}, {"key": "33792789", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7866228395723914, "ground_truth": 0}, {"key": "33792789", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7690802329493204, "ground_truth": 0}, {"key": "33792789", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7879312224610474, "ground_truth": 0}, {"key": "33792789", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869793751728, "ground_truth": 0}, {"key": "33792789", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.825589724113691, "ground_truth": 0}, {"key": "32776626", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7310585736195557, "ground_truth": 0}, {"key": "32776626", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5602526552904177, "ground_truth": 0}, {"key": "32776626", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.42250464412287264, "ground_truth": 0}, {"key": "32776626", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.3942009628425065, "ground_truth": 0}, {"key": "32776626", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646162796084, "ground_truth": 0}, {"key": "37195090", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6808786073358946, "ground_truth": 0}, {"key": "37195090", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6688802515614786, "ground_truth": 0}, {"key": "37195090", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.672331699535798, "ground_truth": 0}, {"key": "37195090", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918544312481, "ground_truth": 0}, {"key": "37195090", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632773215952, "ground_truth": 0}, {"key": "33981824", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.845942436384775, "ground_truth": 0}, {"key": "33981824", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.770464793271349, "ground_truth": 0}, {"key": "33981824", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.744656348873764, "ground_truth": 0}, {"key": "33981824", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.852935471196629, "ground_truth": 0}, {"key": "33981824", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358516173306, "ground_truth": 0}, {"key": "39569142", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8732148299967026, "ground_truth": 0}, {"key": "39569142", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8187367784052063, "ground_truth": 0}, {"key": "39569142", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8895288562015582, "ground_truth": 0}, {"key": "39569142", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578475920683, "ground_truth": 0}, {"key": "39569142", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377672666162, "ground_truth": 0}, {"key": "40268210", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8365545564771983, "ground_truth": 0}, {"key": "40268210", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6723316864752589, "ground_truth": 0}, {"key": "40268210", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8311430583026924, "ground_truth": 0}, {"key": "40268210", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8925625149222737, "ground_truth": 0}, {"key": "40268210", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339736645307, "ground_truth": 0}, {"key": "34925159", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8289387930348692, "ground_truth": 0}, {"key": "34925159", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8104789113991999, "ground_truth": 0}, {"key": "34925159", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6169358535228283, "ground_truth": 0}, {"key": "34925159", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281403432827, "ground_truth": 0}, {"key": "34925159", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9334308079104108, "ground_truth": 0}, {"key": "36181903", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8940517067004705, "ground_truth": 0}, {"key": "36181903", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.849971172609897, "ground_truth": 0}, {"key": "36181903", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.891811034087445, "ground_truth": 0}, {"key": "36181903", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314756874911, "ground_truth": 0}, {"key": "36181903", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218446942888, "ground_truth": 0}, {"key": "38620559", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8519528163972309, "ground_truth": 0}, {"key": "38620559", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8824278754424498, "ground_truth": 0}, {"key": "38620559", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8824278595250695, "ground_truth": 0}, {"key": "38620559", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677592206862, "ground_truth": 0}, {"key": "38620559", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377767559953, "ground_truth": 0}, {"key": "32719657", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7025300374846212, "ground_truth": 0}, {"key": "32719657", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.844921510290325, "ground_truth": 0}, {"key": "32719657", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8164063763920995, "ground_truth": 0}, {"key": "32719657", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388179089426, "ground_truth": 0}, {"key": "32719657", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835283129282, "ground_truth": 0}, {"key": "37530914", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.68930559656951, "ground_truth": 0}, {"key": "37530914", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6442251050467749, "ground_truth": 0}, {"key": "37530914", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.558326982045262, "ground_truth": 0}, {"key": "37530914", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336867622383, "ground_truth": 0}, {"key": "37530914", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876300199180975, "ground_truth": 0}, {"key": "33306933", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8933093937472155, "ground_truth": 0}, {"key": "33306933", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8902942276108711, "ground_truth": 0}, {"key": "33306933", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9155072514389351, "ground_truth": 0}, {"key": "33306933", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952865154137, "ground_truth": 0}, {"key": "33306933", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673202905798, "ground_truth": 0}, {"key": "33837212", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8267117781083284, "ground_truth": 0}, {"key": "33837212", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7534666629489197, "ground_truth": 0}, {"key": "33837212", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8998277840185916, "ground_truth": 0}, {"key": "33837212", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382127970038, "ground_truth": 0}, {"key": "33837212", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.800691999997406, "ground_truth": 0}, {"key": "40945179", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9105454024656011, "ground_truth": 0}, {"key": "40945179", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8044059162969186, "ground_truth": 0}, {"key": "40945179", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9207896760252182, "ground_truth": 0}, {"key": "40945179", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675255014645, "ground_truth": 0}, {"key": "40945179", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942062351663, "ground_truth": 0}, {"key": "34152358", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6757646013680361, "ground_truth": 0}, {"key": "34152358", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7025300743127814, "ground_truth": 0}, {"key": "34152358", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5926666015279655, "ground_truth": 0}, {"key": "34152358", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832196874534, "ground_truth": 0}, {"key": "34152358", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592253887352873, "ground_truth": 0}, {"key": "34136541", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8864204135828828, "ground_truth": 0}, {"key": "34136541", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.817574492995623, "ground_truth": 0}, {"key": "34136541", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.759225418747441, "ground_truth": 0}, {"key": "34136541", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9012274090863454, "ground_truth": 0}, {"key": "34136541", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577680972219229, "ground_truth": 0}, {"key": "37469603", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5794004200841208, "ground_truth": 0}, {"key": "37469603", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6076631738781673, "ground_truth": 0}, {"key": "37469603", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7154240019478876, "ground_truth": 0}, {"key": "37469603", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.71859437736365, "ground_truth": 0}, {"key": "37469603", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493277179972, "ground_truth": 0}, {"key": "37353611", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9569571485220989, "ground_truth": 0}, {"key": "37353611", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9385759541644934, "ground_truth": 0}, {"key": "37353611", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8596637517912968, "ground_truth": 0}, {"key": "37353611", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392902732609, "ground_truth": 0}, {"key": "37353611", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9230391607495867, "ground_truth": 0}, {"key": "37211649", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6424324750854838, "ground_truth": 0}, {"key": "37211649", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6959583375741866, "ground_truth": 0}, {"key": "37211649", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7620701032399865, "ground_truth": 0}, {"key": "37211649", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833745585216, "ground_truth": 0}, {"key": "37211649", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238577449358, "ground_truth": 0}, {"key": "37320976", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6943026691210569, "ground_truth": 0}, {"key": "37320976", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6513548538491789, "ground_truth": 0}, {"key": "37320976", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7401743566468523, "ground_truth": 0}, {"key": "37320976", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059187739668, "ground_truth": 0}, {"key": "37320976", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601724146650204, "ground_truth": 0}, {"key": "34492412", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9304582565048946, "ground_truth": 0}, {"key": "34492412", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8128673186008637, "ground_truth": 0}, {"key": "34492412", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9433475783701026, "ground_truth": 0}, {"key": "34492412", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032942068811023, "ground_truth": 0}, {"key": "34492412", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377703535363, "ground_truth": 0}, {"key": "36655016", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9224823524844731, "ground_truth": 0}, {"key": "36655016", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9399133501351334, "ground_truth": 0}, {"key": "36655016", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9407897561013354, "ground_truth": 0}, {"key": "36655016", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9449947126922418, "ground_truth": 0}, {"key": "36655016", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.889528842091909, "ground_truth": 0}, {"key": "35220773", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7248702789713356, "ground_truth": 0}, {"key": "35220773", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.821044116772966, "ground_truth": 0}, {"key": "35220773", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.734119526056194, "ground_truth": 0}, {"key": "35220773", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527567459782, "ground_truth": 0}, {"key": "35220773", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797745882824, "ground_truth": 0}, {"key": "31569808", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7490872339748096, "ground_truth": 0}, {"key": "31569808", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6406358768035547, "ground_truth": 0}, {"key": "31569808", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6808786246179188, "ground_truth": 0}, {"key": "31569808", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647689442152, "ground_truth": 0}, {"key": "31569808", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245906156658, "ground_truth": 0}, {"key": "37696256", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8068526213940569, "ground_truth": 0}, {"key": "37696256", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8539127438542061, "ground_truth": 0}, {"key": "37696256", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8164063850843317, "ground_truth": 0}, {"key": "37696256", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324945677265, "ground_truth": 0}, {"key": "37696256", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701116040483, "ground_truth": 0}, {"key": "36874328", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8289388194912461, "ground_truth": 0}, {"key": "36874328", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7732163756135544, "ground_truth": 0}, {"key": "36874328", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7577943751981556, "ground_truth": 0}, {"key": "36874328", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430586642029, "ground_truth": 0}, {"key": "36874328", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646872220412, "ground_truth": 0}, {"key": "24532377", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7106283191005548, "ground_truth": 0}, {"key": "24532377", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8539127519082318, "ground_truth": 0}, {"key": "24532377", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8740772314116311, "ground_truth": 0}, {"key": "24532377", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493230383985, "ground_truth": 0}, {"key": "24532377", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982052612663, "ground_truth": 0}, {"key": "39560618", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.661922869244192, "ground_truth": 0}, {"key": "39560618", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7549149767007297, "ground_truth": 0}, {"key": "39560618", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8344068998873901, "ground_truth": 0}, {"key": "39560618", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544175469744, "ground_truth": 0}, {"key": "39560618", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424426356076, "ground_truth": 0}, {"key": "34922693", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.379378376963638, "ground_truth": 0}, {"key": "34922693", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.3849121216839953, "ground_truth": 0}, {"key": "34922693", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5851011394813757, "ground_truth": 0}, {"key": "34922693", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.30404167541042776, "ground_truth": 0}, {"key": "34922693", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064610804791, "ground_truth": 0}, {"key": "33629577", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7648916118983318, "ground_truth": 0}, {"key": "33629577", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7074047016658623, "ground_truth": 0}, {"key": "33629577", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8278281542861169, "ground_truth": 0}, {"key": "33629577", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647727976602, "ground_truth": 0}, {"key": "33629577", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122958641742, "ground_truth": 0}, {"key": "32284359", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.581303112196778, "ground_truth": 0}, {"key": "32284359", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5544704844051894, "ground_truth": 0}, {"key": "32284359", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.672331698700149, "ground_truth": 0}, {"key": "32284359", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.779992906969569, "ground_truth": 0}, {"key": "32284359", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.754914969705621, "ground_truth": 0}, {"key": "28082962", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7772998716608116, "ground_truth": 0}, {"key": "28082962", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6477982296658342, "ground_truth": 0}, {"key": "28082962", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631408990261, "ground_truth": 0}, {"key": "28082962", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666452399221, "ground_truth": 0}, {"key": "28082962", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.618780427648673, "ground_truth": 0}, {"key": "24796803", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9600626911699035, "ground_truth": 0}, {"key": "24796803", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.952574133360926, "ground_truth": 0}, {"key": "24796803", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9539660998836208, "ground_truth": 0}, {"key": "24796803", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9390248065850121, "ground_truth": 0}, {"key": "24796803", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9092645068269771, "ground_truth": 0}, {"key": "35466150", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6791786897541867, "ground_truth": 0}, {"key": "35466150", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8354835161601057, "ground_truth": 0}, {"key": "35466150", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9481545372471345, "ground_truth": 0}, {"key": "35466150", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9196425395731469, "ground_truth": 0}, {"key": "35466150", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677686865945, "ground_truth": 0}, {"key": "35754289", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8643104465276207, "ground_truth": 0}, {"key": "35754289", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7839884621522539, "ground_truth": 0}, {"key": "35754289", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.896251385328267, "ground_truth": 0}, {"key": "35754289", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825914467129, "ground_truth": 0}, {"key": "35754289", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894585774874, "ground_truth": 0}, {"key": "36678662", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.971992478922737, "ground_truth": 0}, {"key": "36678662", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9543079662129982, "ground_truth": 0}, {"key": "36678662", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9092645055097678, "ground_truth": 0}, {"key": "36678662", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037224633338, "ground_truth": 0}, {"key": "36678662", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9543079670503118, "ground_truth": 0}, {"key": "35399671", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.874077240593488, "ground_truth": 0}, {"key": "35399671", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9105453969596076, "ground_truth": 0}, {"key": "35399671", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9092645170170844, "ground_truth": 0}, {"key": "35399671", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9005297887923495, "ground_truth": 0}, {"key": "35399671", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467649871324, "ground_truth": 0}, {"key": "36888180", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8233284040551112, "ground_truth": 0}, {"key": "36888180", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7325918441539588, "ground_truth": 0}, {"key": "36888180", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8872046012190848, "ground_truth": 0}, {"key": "36888180", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148382544326, "ground_truth": 0}, {"key": "36888180", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392794381445, "ground_truth": 0}, {"key": "28061069", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7549149853759651, "ground_truth": 0}, {"key": "28061069", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7279754374189142, "ground_truth": 0}, {"key": "28061069", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253804638305, "ground_truth": 0}, {"key": "28061069", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789044282908, "ground_truth": 0}, {"key": "28061069", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303324251286, "ground_truth": 0}, {"key": "22259982", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7634837656769331, "ground_truth": 0}, {"key": "22259982", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7201715110406862, "ground_truth": 0}, {"key": "22259982", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8633916054012609, "ground_truth": 0}, {"key": "22259982", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563349964623, "ground_truth": 0}, {"key": "22259982", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336998079046, "ground_truth": 0}, {"key": "34026805", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.817574472675146, "ground_truth": 0}, {"key": "34026805", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8807970801149605, "ground_truth": 0}, {"key": "34026805", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.771843486737412, "ground_truth": 0}, {"key": "34026805", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254010764041, "ground_truth": 0}, {"key": "34026805", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215244176943, "ground_truth": 0}, {"key": "36713809", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9263037324116872, "ground_truth": 0}, {"key": "36713809", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8910549605886097, "ground_truth": 0}, {"key": "36713809", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9339146200504923, "ground_truth": 0}, {"key": "36713809", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9257686332328205, "ground_truth": 0}, {"key": "36713809", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9579122687242827, "ground_truth": 0}, {"key": "39726411", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7718435216846576, "ground_truth": 0}, {"key": "39726411", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7217432057551455, "ground_truth": 0}, {"key": "39726411", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8068526226998257, "ground_truth": 0}, {"key": "39726411", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.635222442986625, "ground_truth": 0}, {"key": "39726411", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740166280575, "ground_truth": 0}, {"key": "37069841", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.874077233015157, "ground_truth": 0}, {"key": "37069841", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8902942311912999, "ground_truth": 0}, {"key": "37069841", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8749346315162999, "ground_truth": 0}, {"key": "37069841", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869929581598, "ground_truth": 0}, {"key": "37069841", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9273632978691776, "ground_truth": 0}, {"key": "38894693", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7416740080166903, "ground_truth": 0}, {"key": "38894693", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6740504844827643, "ground_truth": 0}, {"key": "38894693", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8116760333249168, "ground_truth": 0}, {"key": "38894693", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197835246019, "ground_truth": 0}, {"key": "38894693", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.759225432373861, "ground_truth": 0}, {"key": "33946032", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9643214466882453, "ground_truth": 0}, {"key": "33946032", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9732407134075601, "ground_truth": 0}, {"key": "33946032", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9713473348124773, "ground_truth": 0}, {"key": "33946032", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9252299501781203, "ground_truth": 0}, {"key": "33946032", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9449947133206025, "ground_truth": 0}, {"key": "39035311", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9086178961619749, "ground_truth": 0}, {"key": "39035311", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9343951650513963, "ground_truth": 0}, {"key": "39035311", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9661559675919151, "ground_truth": 0}, {"key": "39035311", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9441768615381622, "ground_truth": 0}, {"key": "39035311", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9358173537539896, "ground_truth": 0}, {"key": "27680038", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.535098413762889, "ground_truth": 0}, {"key": "27680038", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6406358920047641, "ground_truth": 0}, {"key": "27680038", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6169358434071466, "ground_truth": 0}, {"key": "27680038", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056190211311, "ground_truth": 0}, {"key": "27680038", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907791981933564, "ground_truth": 0}, {"key": "36901907", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7732163620739156, "ground_truth": 0}, {"key": "36901907", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8615382205894183, "ground_truth": 0}, {"key": "36901907", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7956581163847275, "ground_truth": 0}, {"key": "36901907", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701040890216, "ground_truth": 0}, {"key": "36901907", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303390033062, "ground_truth": 0}, {"key": "21530542", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5583269780234855, "ground_truth": 0}, {"key": "21530542", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6477982375072768, "ground_truth": 0}, {"key": "21530542", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5350984328024002, "ground_truth": 0}, {"key": "21530542", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737656923447, "ground_truth": 0}, {"key": "21530542", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791787015581165, "ground_truth": 0}, {"key": "38192532", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9485372386751304, "ground_truth": 0}, {"key": "38192532", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9529258209036247, "ground_truth": 0}, {"key": "38192532", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9559813460885361, "ground_truth": 0}, {"key": "38192532", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9575961732393133, "ground_truth": 0}, {"key": "38192532", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9549844683940009, "ground_truth": 0}, {"key": "34102400", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6206216179869529, "ground_truth": 0}, {"key": "34102400", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.359364127809469, "ground_truth": 0}, {"key": "34102400", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7217432028266603, "ground_truth": 0}, {"key": "34102400", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526295534478, "ground_truth": 0}, {"key": "34102400", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102479850204, "ground_truth": 0}, {"key": "36133399", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8529354884549806, "ground_truth": 0}, {"key": "36133399", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8714748523694992, "ground_truth": 0}, {"key": "36133399", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7981867616477519, "ground_truth": 0}, {"key": "36133399", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.877476785856736, "ground_truth": 0}, {"key": "36133399", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159494326229, "ground_truth": 0}, {"key": "34314544", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7446563530404302, "ground_truth": 0}, {"key": "34314544", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7813306265585958, "ground_truth": 0}, {"key": "34314544", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7008947955150749, "ground_truth": 0}, {"key": "34314544", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740301290467, "ground_truth": 0}, {"key": "34314544", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898471203281, "ground_truth": 0}, {"key": "33460074", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8791467647460216, "ground_truth": 0}, {"key": "33460074", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8902942275108865, "ground_truth": 0}, {"key": "33460074", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8933094156479607, "ground_truth": 0}, {"key": "33460074", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240954655303, "ground_truth": 0}, {"key": "33460074", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923168829709, "ground_truth": 0}, {"key": "36191495", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7201715176072737, "ground_truth": 0}, {"key": "36191495", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7981867691659414, "ground_truth": 0}, {"key": "36191495", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8705972655181521, "ground_truth": 0}, {"key": "36191495", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802208258781, "ground_truth": 0}, {"key": "36191495", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647806720492, "ground_truth": 0}, {"key": "39532668", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9453993911854055, "ground_truth": 0}, {"key": "39532668", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9213576194301958, "ground_truth": 0}, {"key": "39532668", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8895288461549334, "ground_truth": 0}, {"key": "39532668", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278674002831, "ground_truth": 0}, {"key": "39532668", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9130583509136386, "ground_truth": 0}, {"key": "20328247", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5869964430061604, "ground_truth": 0}, {"key": "20328247", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5563995655852788, "ground_truth": 0}, {"key": "20328247", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6076631549658708, "ground_truth": 0}, {"key": "20328247", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593464664695, "ground_truth": 0}, {"key": "20328247", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358498439863, "ground_truth": 0}, {"key": "39112675", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.57367841436894, "ground_truth": 0}, {"key": "39112675", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6495786257675322, "ground_truth": 0}, {"key": "39112675", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7490872250891181, "ground_truth": 0}, {"key": "39112675", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.637030778231701, "ground_truth": 0}, {"key": "39112675", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419749421852, "ground_truth": 0}, {"key": "31620300", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6513548667253132, "ground_truth": 0}, {"key": "31620300", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5736784178798106, "ground_truth": 0}, {"key": "31620300", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.638835276286017, "ground_truth": 0}, {"key": "31620300", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321879478578, "ground_truth": 0}, {"key": "31620300", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074047006668932, "ground_truth": 0}, {"key": "37518509", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6671476625536237, "ground_truth": 0}, {"key": "37518509", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5312093808677533, "ground_truth": 0}, {"key": "37518509", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5983121981001569, "ground_truth": 0}, {"key": "37518509", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833912151358, "ground_truth": 0}, {"key": "37518509", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786903886755, "ground_truth": 0}, {"key": "35454095", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7704647873445213, "ground_truth": 0}, {"key": "35454095", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9230391613389997, "ground_truth": 0}, {"key": "35454095", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8723473699629481, "ground_truth": 0}, {"key": "35454095", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437923649873, "ground_truth": 0}, {"key": "35454095", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311794504517, "ground_truth": 0}, {"key": "38542788", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.953621796740665, "ground_truth": 0}, {"key": "38542788", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9299510404862482, "ground_truth": 0}, {"key": "38542788", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9651191116928985, "ground_truth": 0}, {"key": "38542788", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9742394414858351, "ground_truth": 0}, {"key": "38542788", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9629528308516524, "ground_truth": 0}, {"key": "23944937", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5156199165622611, "ground_truth": 0}, {"key": "23944937", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4921881200548931, "ground_truth": 0}, {"key": "23944937", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5370413957927872, "ground_truth": 0}, {"key": "23944937", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4804787189257649, "ground_truth": 0}, {"key": "23944937", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544096332173, "ground_truth": 0}, {"key": "31753944", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5058591127517683, "ground_truth": 0}, {"key": "31753944", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5214711548174316, "ground_truth": 0}, {"key": "31753944", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5794003880587836, "ground_truth": 0}, {"key": "31753944", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299989557769, "ground_truth": 0}, {"key": "31753944", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324880124527, "ground_truth": 0}, {"key": "35527214", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.864310449226615, "ground_truth": 0}, {"key": "35527214", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8539127578077989, "ground_truth": 0}, {"key": "35527214", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.663668933352534, "ground_truth": 0}, {"key": "35527214", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544376203041, "ground_truth": 0}, {"key": "35527214", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675319194481, "ground_truth": 0}, {"key": "40400404", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9706877677759365, "ground_truth": 0}, {"key": "40400404", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9648551521798587, "ground_truth": 0}, {"key": "40400404", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9759464473878089, "ground_truth": 0}, {"key": "40400404", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9640516734408907, "ground_truth": 0}, {"key": "40400404", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9695556491259503, "ground_truth": 0}, {"key": "21713119", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7446563340642114, "ground_truth": 0}, {"key": "21713119", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7416740109808901, "ground_truth": 0}, {"key": "21713119", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7620700905739303, "ground_truth": 0}, {"key": "21713119", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233284032264063, "ground_truth": 0}, {"key": "21713119", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884667473827, "ground_truth": 0}, {"key": "28730678", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7690802335084009, "ground_truth": 0}, {"key": "28730678", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7732163677700588, "ground_truth": 0}, {"key": "28730678", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8606036057974419, "ground_truth": 0}, {"key": "28730678", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441153662438, "ground_truth": 0}, {"key": "28730678", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9362850040830437, "ground_truth": 0}, {"key": "36823733", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9246876880740874, "ground_truth": 0}, {"key": "36823733", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8031738030441303, "ground_truth": 0}, {"key": "36823733", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9224823455585371, "ground_truth": 0}, {"key": "36823733", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568123047786645, "ground_truth": 0}, {"key": "36823733", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8933094149218256, "ground_truth": 0}, {"key": "35988862", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6334102294238848, "ground_truth": 0}, {"key": "35988862", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6242935502934814, "ground_truth": 0}, {"key": "35988862", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.781330622295561, "ground_truth": 0}, {"key": "35988862", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241939661362, "ground_truth": 0}, {"key": "35988862", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757645699233412, "ground_truth": 0}, {"key": "40499665", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9773707993290203, "ground_truth": 0}, {"key": "40499665", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9473810447065971, "ground_truth": 0}, {"key": "40499665", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9481545326538079, "ground_truth": 0}, {"key": "40499665", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9556514149420446, "ground_truth": 0}, {"key": "40499665", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9329437138548993, "ground_truth": 0}, {"key": "32829820", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8615382098746256, "ground_truth": 0}, {"key": "32829820", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7879312118169555, "ground_truth": 0}, {"key": "32829820", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7956581102490681, "ground_truth": 0}, {"key": "32829820", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254124722231, "ground_truth": 0}, {"key": "32829820", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916286235355, "ground_truth": 0}, {"key": "20583553", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7025300655995289, "ground_truth": 0}, {"key": "20583553", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5679366136172342, "ground_truth": 0}, {"key": "20583553", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6548947283676948, "ground_truth": 0}, {"key": "20583553", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.48633154656371524, "ground_truth": 0}, {"key": "20583553", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365471521071, "ground_truth": 0}, {"key": "30501550", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9728307653597342, "ground_truth": 0}, {"key": "30501550", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9600626857070045, "ground_truth": 0}, {"key": "30501550", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9669140233572566, "ground_truth": 0}, {"key": "30501550", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9563089414629637, "ground_truth": 0}, {"key": "30501550", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9773707996087797, "ground_truth": 0}, {"key": "38755897", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6926419779495874, "ground_truth": 0}, {"key": "38755897", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7264255998454636, "ground_truth": 0}, {"key": "38755897", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.868826778354957, "ground_truth": 0}, {"key": "38755897", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789283283712, "ground_truth": 0}, {"key": "38755897", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528126497096, "ground_truth": 0}, {"key": "35507201", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7648916280062901, "ground_truth": 0}, {"key": "35507201", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6495786182723121, "ground_truth": 0}, {"key": "35507201", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6242935186728223, "ground_truth": 0}, {"key": "35507201", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631507789397, "ground_truth": 0}, {"key": "35507201", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419967402992, "ground_truth": 0}, {"key": "36453511", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835412615278, "ground_truth": 0}, {"key": "36453511", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8615382104115732, "ground_truth": 0}, {"key": "36453511", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8267117878800879, "ground_truth": 0}, {"key": "36453511", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346187445961, "ground_truth": 0}, {"key": "36453511", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277770844793, "ground_truth": 0}, {"key": "38066835", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.875786995048709, "ground_truth": 0}, {"key": "38066835", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8577681039961054, "ground_truth": 0}, {"key": "38066835", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9196425302713919, "ground_truth": 0}, {"key": "38066835", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9161096160558665, "ground_truth": 0}, {"key": "38066835", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916089336366, "ground_truth": 0}, {"key": "39697181", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6959583055371588, "ground_truth": 0}, {"key": "39697181", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6976089273499669, "ground_truth": 0}, {"key": "39697181", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7201715107992602, "ground_truth": 0}, {"key": "39697181", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837566698042, "ground_truth": 0}, {"key": "39697181", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512033589175, "ground_truth": 0}, {"key": "21820893", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8333245958658237, "ground_truth": 0}, {"key": "21820893", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8322366566995067, "ground_truth": 0}, {"key": "21820893", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7918210717052565, "ground_truth": 0}, {"key": "21820893", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891459813578, "ground_truth": 0}, {"key": "21820893", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085955638776, "ground_truth": 0}, {"key": "40519933", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8376199695720253, "ground_truth": 0}, {"key": "40519933", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7371581711042757, "ground_truth": 0}, {"key": "40519933", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9207896772929943, "ground_truth": 0}, {"key": "40519933", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920259797937, "ground_truth": 0}, {"key": "40519933", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314802408555, "ground_truth": 0}, {"key": "30446033", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7279754331422594, "ground_truth": 0}, {"key": "30446033", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6723317110571608, "ground_truth": 0}, {"key": "30446033", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.87321482574864, "ground_truth": 0}, {"key": "30446033", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324924522544, "ground_truth": 0}, {"key": "30446033", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666332327219, "ground_truth": 0}, {"key": "40216291", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7918210676741002, "ground_truth": 0}, {"key": "40216291", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8577681074417768, "ground_truth": 0}, {"key": "40216291", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8344068853366713, "ground_truth": 0}, {"key": "40216291", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489721992175566, "ground_truth": 0}, {"key": "40216291", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511409988212, "ground_truth": 0}, {"key": "33479118", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7969253734652245, "ground_truth": 0}, {"key": "33479118", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6688802482871954, "ground_truth": 0}, {"key": "33479118", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7534666606158756, "ground_truth": 0}, {"key": "33479118", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563330010192, "ground_truth": 0}, {"key": "33479118", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059153982235, "ground_truth": 0}, {"key": "22297373", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7853085646750644, "ground_truth": 0}, {"key": "22297373", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7295197438641824, "ground_truth": 0}, {"key": "22297373", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6370308293809619, "ground_truth": 0}, {"key": "22297373", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.596433158740702, "ground_truth": 0}, {"key": "22297373", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631741227053, "ground_truth": 0}, {"key": "36463668", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6876300137346758, "ground_truth": 0}, {"key": "36463668", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8244619283665084, "ground_truth": 0}, {"key": "36463668", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.817574473842176, "ground_truth": 0}, {"key": "36463668", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441037323594, "ground_truth": 0}, {"key": "36463668", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672082265534, "ground_truth": 0}, {"key": "35264615", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6876299915670072, "ground_truth": 0}, {"key": "35264615", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8006920126444687, "ground_truth": 0}, {"key": "35264615", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6477982327220143, "ground_truth": 0}, {"key": "35264615", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149734352346, "ground_truth": 0}, {"key": "35264615", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740395532434, "ground_truth": 0}, {"key": "39898482", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9130583420483156, "ground_truth": 0}, {"key": "39898482", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9458012688790051, "ground_truth": 0}, {"key": "39898482", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9453993945912463, "ground_truth": 0}, {"key": "39898482", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361721757273, "ground_truth": 0}, {"key": "39898482", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9640516765142322, "ground_truth": 0}, {"key": "37228721", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7892337045399538, "ground_truth": 0}, {"key": "37228721", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8428631623144003, "ground_truth": 0}, {"key": "37228721", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8548846407442815, "ground_truth": 0}, {"key": "37228721", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358318632319, "ground_truth": 0}, {"key": "37228721", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159688412853, "ground_truth": 0}, {"key": "24535799", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.958537727799364, "ground_truth": 0}, {"key": "24535799", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9738443820062479, "ground_truth": 0}, {"key": "24535799", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9367494731818966, "ground_truth": 0}, {"key": "24535799", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9651191151997677, "ground_truth": 0}, {"key": "24535799", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9420819130931588, "ground_truth": 0}, {"key": "35177759", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8418256600779714, "ground_truth": 0}, {"key": "35177759", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6808786220270662, "ground_truth": 0}, {"key": "35177759", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7008948225124445, "ground_truth": 0}, {"key": "35177759", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936559363445, "ground_truth": 0}, {"key": "35177759", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840542896761, "ground_truth": 0}, {"key": "34364829", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.763483774977627, "ground_truth": 0}, {"key": "34364829", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7325918288923907, "ground_truth": 0}, {"key": "34364829", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6601723781030036, "ground_truth": 0}, {"key": "34364829", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737183977663, "ground_truth": 0}, {"key": "34364829", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352520986263, "ground_truth": 0}, {"key": "38090732", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.837619963006611, "ground_truth": 0}, {"key": "38090732", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.798186783846011, "ground_truth": 0}, {"key": "38090732", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7956581100434831, "ground_truth": 0}, {"key": "38090732", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333245952546728, "ground_truth": 0}, {"key": "38090732", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891444757452, "ground_truth": 0}, {"key": "30651479", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7772998610488211, "ground_truth": 0}, {"key": "30651479", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8187368071553116, "ground_truth": 0}, {"key": "30651479", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8887587928455906, "ground_truth": 0}, {"key": "30651479", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846284371137, "ground_truth": 0}, {"key": "30651479", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148270271405, "ground_truth": 0}, {"key": "39380921", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8615382105275543, "ground_truth": 0}, {"key": "39380921", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8749346196600386, "ground_truth": 0}, {"key": "39380921", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8221891455553183, "ground_truth": 0}, {"key": "39380921", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240866360096, "ground_truth": 0}, {"key": "39380921", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740113547342, "ground_truth": 0}, {"key": "39037490", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5448014068060532, "ground_truth": 0}, {"key": "39037490", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5331544139697985, "ground_truth": 0}, {"key": "39037490", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.4707365831292476, "ground_truth": 0}, {"key": "39037490", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.41300357699926266, "ground_truth": 0}, {"key": "39037490", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995643630523, "ground_truth": 0}, {"key": "35917499", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.838679770864445, "ground_truth": 0}, {"key": "35917499", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.890294225405669, "ground_truth": 0}, {"key": "35917499", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8816149003505299, "ground_truth": 0}, {"key": "35917499", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897257342968, "ground_truth": 0}, {"key": "35917499", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9304582575516945, "ground_truth": 0}, {"key": "34908073", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7786492950357867, "ground_truth": 0}, {"key": "34908073", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7310585841432741, "ground_truth": 0}, {"key": "34908073", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.789233702328332, "ground_truth": 0}, {"key": "34908073", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916217374052, "ground_truth": 0}, {"key": "34908073", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506641838305, "ground_truth": 0}, {"key": "36344759", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9235923210686037, "ground_truth": 0}, {"key": "36344759", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9111797093405866, "ground_truth": 0}, {"key": "36344759", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9458012714741479, "ground_truth": 0}, {"key": "36344759", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9059898093160719, "ground_truth": 0}, {"key": "36344759", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9273632920454669, "ground_truth": 0}, {"key": "39984637", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.778649322430282, "ground_truth": 0}, {"key": "39984637", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6513548480802158, "ground_truth": 0}, {"key": "39984637", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6150878651664067, "ground_truth": 0}, {"key": "39984637", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.533154425564003, "ground_truth": 0}, {"key": "39984637", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269911378306, "ground_truth": 0}, {"key": "17917326", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8732148312999, "ground_truth": 0}, {"key": "17917326", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8872045965849239, "ground_truth": 0}, {"key": "17917326", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9339146224577016, "ground_truth": 0}, {"key": "17917326", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359929619381, "ground_truth": 0}, {"key": "17917326", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672039729245, "ground_truth": 0}, {"key": "32193638", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7490871983672817, "ground_truth": 0}, {"key": "32193638", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8267117852984053, "ground_truth": 0}, {"key": "32193638", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898651620903, "ground_truth": 0}, {"key": "32193638", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833808941537, "ground_truth": 0}, {"key": "32193638", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382232301014, "ground_truth": 0}, {"key": "34564692", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7041601503825204, "ground_truth": 0}, {"key": "34564692", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7634837811225262, "ground_truth": 0}, {"key": "34564692", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7401743438387369, "ground_truth": 0}, {"key": "34564692", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943848654918, "ground_truth": 0}, {"key": "34564692", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867782787534, "ground_truth": 0}, {"key": "39329284", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9901401450791772, "ground_truth": 0}, {"key": "39329284", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6095241708278346, "ground_truth": 0}, {"key": "39329284", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9874720664430062, "ground_truth": 0}, {"key": "39329284", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9873750508693883, "ground_truth": 0}, {"key": "39329284", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9940428459961194, "ground_truth": 0}, {"key": "37438541", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7185943898769397, "ground_truth": 0}, {"key": "37438541", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6477982292519695, "ground_truth": 0}, {"key": "37438541", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.542863256707588, "ground_truth": 0}, {"key": "37438541", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210822380958, "ground_truth": 0}, {"key": "37438541", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737286580437, "ground_truth": 0}, {"key": "34652757", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9178933757378118, "ground_truth": 0}, {"key": "34652757", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9173026617888947, "ground_truth": 0}, {"key": "34652757", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631453079414, "ground_truth": 0}, {"key": "34652757", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036245705092, "ground_truth": 0}, {"key": "34652757", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9173026588797916, "ground_truth": 0}, {"key": "31361004", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7606506646871988, "ground_truth": 0}, {"key": "31361004", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8233284146957103, "ground_truth": 0}, {"key": "31361004", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8397339601796724, "ground_truth": 0}, {"key": "31361004", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718435135806937, "ground_truth": 0}, {"key": "31361004", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9173026722596387, "ground_truth": 0}, {"key": "26150727", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7233094579638258, "ground_truth": 0}, {"key": "26150727", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7892337127065162, "ground_truth": 0}, {"key": "26150727", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6297746333315156, "ground_truth": 0}, {"key": "26150727", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585891195823, "ground_truth": 0}, {"key": "26150727", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640040181239, "ground_truth": 0}, {"key": "36997402", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.854884634256801, "ground_truth": 0}, {"key": "36997402", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9111797037594794, "ground_truth": 0}, {"key": "36997402", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9142907217860473, "ground_truth": 0}, {"key": "36997402", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823453242773, "ground_truth": 0}, {"key": "36997402", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9039745128040414, "ground_truth": 0}, {"key": "37430643", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5888891334519315, "ground_truth": 0}, {"key": "37430643", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7074047055911848, "ground_truth": 0}, {"key": "37430643", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6893055851085536, "ground_truth": 0}, {"key": "37430643", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526623007142, "ground_truth": 0}, {"key": "37430643", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321970518379, "ground_truth": 0}, {"key": "36964631", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8539127456090794, "ground_truth": 0}, {"key": "36964631", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.900529784232187, "ground_truth": 0}, {"key": "36964631", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8679338360871827, "ground_truth": 0}, {"key": "36964631", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528003278543, "ground_truth": 0}, {"key": "36964631", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281595319907, "ground_truth": 0}, {"key": "35502013", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7620701082245268, "ground_truth": 0}, {"key": "35502013", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5907792321843777, "ground_truth": 0}, {"key": "35502013", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898513699638, "ground_truth": 0}, {"key": "35502013", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321995224686, "ground_truth": 0}, {"key": "35502013", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701086638232, "ground_truth": 0}, {"key": "33987664", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8187368118685512, "ground_truth": 0}, {"key": "33987664", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9358173634447736, "ground_truth": 0}, {"key": "33987664", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8558511465651407, "ground_truth": 0}, {"key": "33987664", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339816491876, "ground_truth": 0}, {"key": "33987664", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.873214822616405, "ground_truth": 0}, {"key": "35203721", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.622459330487804, "ground_truth": 0}, {"key": "35203721", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6076631754682338, "ground_truth": 0}, {"key": "35203721", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5755880145893136, "ground_truth": 0}, {"key": "35203721", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.769080245420105, "ground_truth": 0}, {"key": "35203721", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525396824390185, "ground_truth": 0}, {"key": "39028348", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8344068983550025, "ground_truth": 0}, {"key": "39028348", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8615382008680273, "ground_truth": 0}, {"key": "39028348", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8244619347726263, "ground_truth": 0}, {"key": "39028348", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672278894114, "ground_truth": 0}, {"key": "39028348", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998805686615, "ground_truth": 0}, {"key": "37459383", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7690802309808021, "ground_truth": 0}, {"key": "37459383", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8723473609090728, "ground_truth": 0}, {"key": "37459383", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631475305812, "ground_truth": 0}, {"key": "37459383", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8879840390938057, "ground_truth": 0}, {"key": "37459383", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127636428046, "ground_truth": 0}, {"key": "34020070", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6959583261482452, "ground_truth": 0}, {"key": "34020070", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7401743721041942, "ground_truth": 0}, {"key": "34020070", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7431680214784147, "ground_truth": 0}, {"key": "34020070", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504727249459, "ground_truth": 0}, {"key": "34020070", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.752012572153324, "ground_truth": 0}, {"key": "35176615", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835415789141, "ground_truth": 0}, {"key": "35176615", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8879840406346649, "ground_truth": 0}, {"key": "35176615", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6842640381818823, "ground_truth": 0}, {"key": "35176615", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.746138965361055, "ground_truth": 0}, {"key": "35176615", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799929004920506, "ground_truth": 0}, {"key": "33296389", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7759445621243054, "ground_truth": 0}, {"key": "33296389", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7676898677390604, "ground_truth": 0}, {"key": "33296389", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631550436902, "ground_truth": 0}, {"key": "33296389", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.796925365707735, "ground_truth": 0}, {"key": "33296389", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897396104808, "ground_truth": 0}, {"key": "35399504", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.920217981761664, "ground_truth": 0}, {"key": "35399504", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9224823409211562, "ground_truth": 0}, {"key": "35399504", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9489172652021095, "ground_truth": 0}, {"key": "35399504", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9348724499101931, "ground_truth": 0}, {"key": "35399504", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9111797087800513, "ground_truth": 0}, {"key": "34807886", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6876299925397352, "ground_truth": 0}, {"key": "34807886", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6791787117070822, "ground_truth": 0}, {"key": "34807886", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7185944034272526, "ground_truth": 0}, {"key": "34807886", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321815804117, "ground_truth": 0}, {"key": "34807886", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792101498934, "ground_truth": 0}, {"key": "37629813", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7057850058899866, "ground_truth": 0}, {"key": "37629813", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8459424397297648, "ground_truth": 0}, {"key": "37629813", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059358156382, "ground_truth": 0}, {"key": "37629813", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106283011549974, "ground_truth": 0}, {"key": "37629813", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.746138991498595, "ground_truth": 0}, {"key": "28084389", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.85096470160602, "ground_truth": 0}, {"key": "28084389", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.854884644561828, "ground_truth": 0}, {"key": "28084389", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7786493188201635, "ground_truth": 0}, {"key": "28084389", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619257589143, "ground_truth": 0}, {"key": "28084389", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972681478054, "ground_truth": 0}, {"key": "35391734", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8824278740524131, "ground_truth": 0}, {"key": "35391734", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9678992920303954, "ground_truth": 0}, {"key": "35391734", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9230391664714479, "ground_truth": 0}, {"key": "35391734", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9683812349757659, "ground_truth": 0}, {"key": "35391734", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9582261153967688, "ground_truth": 0}, {"key": "40214591", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8140528055521579, "ground_truth": 0}, {"key": "40214591", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8740772414005107, "ground_truth": 0}, {"key": "40214591", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8198933331006744, "ground_truth": 0}, {"key": "40214591", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256519496805, "ground_truth": 0}, {"key": "40214591", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757870012805448, "ground_truth": 0}, {"key": "26283171", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.824461936290975, "ground_truth": 0}, {"key": "26283171", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9053222969968414, "ground_truth": 0}, {"key": "26283171", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8031738108942084, "ground_truth": 0}, {"key": "26283171", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367824212237, "ground_truth": 0}, {"key": "26283171", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592253777361986, "ground_truth": 0}, {"key": "37084030", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7401743243795036, "ground_truth": 0}, {"key": "37084030", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7943849673337534, "ground_truth": 0}, {"key": "37084030", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7401743389112896, "ground_truth": 0}, {"key": "37084030", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581582410403, "ground_truth": 0}, {"key": "37084030", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.713830749597435, "ground_truth": 0}, {"key": "39027295", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.3830641785382247, "ground_truth": 0}, {"key": "39027295", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.41111086048373563, "ground_truth": 0}, {"key": "39027295", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5448013897807795, "ground_truth": 0}, {"key": "39027295", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621765012955553, "ground_truth": 0}, {"key": "39027295", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5813030945875807, "ground_truth": 0}, {"key": "14018647", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6791786979329046, "ground_truth": 0}, {"key": "14018647", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5331543842715608, "ground_truth": 0}, {"key": "14018647", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7106283177793268, "ground_truth": 0}, {"key": "14018647", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033701550633, "ground_truth": 0}, {"key": "14018647", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292634283170454, "ground_truth": 0}, {"key": "37424289", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9500414746232776, "ground_truth": 0}, {"key": "37424289", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9563089367238057, "ground_truth": 0}, {"key": "37424289", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9549844658914998, "ground_truth": 0}, {"key": "37424289", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9693241941518128, "ground_truth": 0}, {"key": "37424289", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9726235105810008, "ground_truth": 0}, {"key": "37498031", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7759445493585456, "ground_truth": 0}, {"key": "37498031", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8910549613751649, "ground_truth": 0}, {"key": "37498031", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7090191441234812, "ground_truth": 0}, {"key": "37498031", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.856812292244719, "ground_truth": 0}, {"key": "37498031", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314781738673, "ground_truth": 0}, {"key": "30104095", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9334308168490364, "ground_truth": 0}, {"key": "30104095", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9489172627241247, "ground_truth": 0}, {"key": "30104095", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8354835421075798, "ground_truth": 0}, {"key": "30104095", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9284088027060998, "ground_truth": 0}, {"key": "30104095", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9273632927846012, "ground_truth": 0}, {"key": "37911407", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9092645128655504, "ground_truth": 0}, {"key": "37911407", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8807970817520546, "ground_truth": 0}, {"key": "37911407", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9372107866738277, "ground_truth": 0}, {"key": "37911407", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9142907282107656, "ground_truth": 0}, {"key": "37911407", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9334308122098663, "ground_truth": 0}, {"key": "39177472", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9032942090440164, "ground_truth": 0}, {"key": "39177472", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9299510370631497, "ground_truth": 0}, {"key": "39177472", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9136765214134591, "ground_truth": 0}, {"key": "39177472", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.869714566857362, "ground_truth": 0}, {"key": "39177472", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9339146240839943, "ground_truth": 0}, {"key": "32325454", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8558511473833635, "ground_truth": 0}, {"key": "32325454", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8499711819754932, "ground_truth": 0}, {"key": "32325454", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8068526135698988, "ground_truth": 0}, {"key": "32325454", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240846058725, "ground_truth": 0}, {"key": "32325454", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333246020893668, "ground_truth": 0}, {"key": "38395319", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7866228152870287, "ground_truth": 0}, {"key": "38395319", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7969253796395936, "ground_truth": 0}, {"key": "38395319", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7534666708974495, "ground_truth": 0}, {"key": "38395319", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303259786006, "ground_truth": 0}, {"key": "38395319", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998852941337, "ground_truth": 0}, {"key": "38235895", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8679338435041537, "ground_truth": 0}, {"key": "38235895", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8697145813245514, "ground_truth": 0}, {"key": "38235895", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059262195433, "ground_truth": 0}, {"key": "38235895", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333245900627855, "ground_truth": 0}, {"key": "38235895", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.86431045798399, "ground_truth": 0}, {"key": "26543267", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7534666622145231, "ground_truth": 0}, {"key": "26543267", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8221891318686507, "ground_truth": 0}, {"key": "26543267", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.796925379896174, "ground_truth": 0}, {"key": "26543267", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526060378204, "ground_truth": 0}, {"key": "26543267", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321958008538, "ground_truth": 0}, {"key": "39054728", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9834704448817823, "ground_truth": 0}, {"key": "39054728", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9923637841924381, "ground_truth": 0}, {"key": "39054728", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9892648382277186, "ground_truth": 0}, {"key": "39054728", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9753900738494337, "ground_truth": 0}, {"key": "39054728", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9811668683970289, "ground_truth": 0}, {"key": "39158443", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9019206848874369, "ground_truth": 0}, {"key": "39158443", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8459424440101333, "ground_truth": 0}, {"key": "39158443", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8548846298436014, "ground_truth": 0}, {"key": "39158443", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278595664155, "ground_truth": 0}, {"key": "39158443", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.855851143824922, "ground_truth": 0}, {"key": "36254201", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5544704657868934, "ground_truth": 0}, {"key": "36254201", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6566582708514838, "ground_truth": 0}, {"key": "36254201", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6334102517757407, "ground_truth": 0}, {"key": "36254201", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646063892744, "ground_truth": 0}, {"key": "36254201", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241869366222, "ground_truth": 0}, {"key": "23434347", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6636689339327233, "ground_truth": 0}, {"key": "23434347", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5907791930286074, "ground_truth": 0}, {"key": "23434347", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.78530858625485, "ground_truth": 0}, {"key": "23434347", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506536829537, "ground_truth": 0}, {"key": "23434347", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210779795578, "ground_truth": 0}, {"key": "34397620", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6297746077976429, "ground_truth": 0}, {"key": "34397620", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5117166246131155, "ground_truth": 0}, {"key": "34397620", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.48242912228261053, "ground_truth": 0}, {"key": "34397620", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228714670237, "ground_truth": 0}, {"key": "34397620", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241773879603, "ground_truth": 0}, {"key": "34340916", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8766343759703966, "ground_truth": 0}, {"key": "34340916", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7310585752657885, "ground_truth": 0}, {"key": "34340916", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7905303244074506, "ground_truth": 0}, {"key": "34340916", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314739770854, "ground_truth": 0}, {"key": "34340916", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715123568878, "ground_truth": 0}, {"key": "30375089", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7839884730906953, "ground_truth": 0}, {"key": "30375089", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7634837619796491, "ground_truth": 0}, {"key": "30375089", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6039318258920647, "ground_truth": 0}, {"key": "30375089", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251062275789, "ground_truth": 0}, {"key": "30375089", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281528176132, "ground_truth": 0}, {"key": "35807797", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9367494789611149, "ground_truth": 0}, {"key": "35807797", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9019206662525177, "ground_truth": 0}, {"key": "35807797", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9161096136487723, "ground_truth": 0}, {"key": "35807797", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9449947087538569, "ground_truth": 0}, {"key": "35807797", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9257686341458421, "ground_truth": 0}, {"key": "34188172", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6893056402354596, "ground_truth": 0}, {"key": "34188172", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6113819930961408, "ground_truth": 0}, {"key": "34188172", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8984105555490518, "ground_truth": 0}, {"key": "34188172", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563380900849, "ground_truth": 0}, {"key": "34188172", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.567936611980028, "ground_truth": 0}, {"key": "37075567", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8832359925653347, "ground_truth": 0}, {"key": "37075567", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.778649294801803, "ground_truth": 0}, {"key": "37075567", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9329437208231491, "ground_truth": 0}, {"key": "37075567", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891094209288, "ground_truth": 0}, {"key": "37075567", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104598048984, "ground_truth": 0}, {"key": "35559735", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6279512158156154, "ground_truth": 0}, {"key": "35559735", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7634837734959457, "ground_truth": 0}, {"key": "35559735", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7431679991075855, "ground_truth": 0}, {"key": "35559735", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339611574196, "ground_truth": 0}, {"key": "35559735", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419696159901, "ground_truth": 0}, {"key": "33005019", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6601723552754625, "ground_truth": 0}, {"key": "33005019", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4980468823557036, "ground_truth": 0}, {"key": "33005019", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8244619247392528, "ground_truth": 0}, {"key": "33005019", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201715105350027, "ground_truth": 0}, {"key": "33005019", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884776401822, "ground_truth": 0}, {"key": "30808252", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9167080709828241, "ground_truth": 0}, {"key": "30808252", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8128673200228677, "ground_truth": 0}, {"key": "30808252", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8128673286193892, "ground_truth": 0}, {"key": "30808252", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339741173369, "ground_truth": 0}, {"key": "30808252", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897167694958, "ground_truth": 0}, {"key": "15159017", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7853085946671914, "ground_truth": 0}, {"key": "15159017", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8469578279276092, "ground_truth": 0}, {"key": "15159017", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7892337061802502, "ground_truth": 0}, {"key": "15159017", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339701636076, "ground_truth": 0}, {"key": "15159017", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673066533932, "ground_truth": 0}, {"key": "24493400", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7490872234481699, "ground_truth": 0}, {"key": "24493400", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7563575606034987, "ground_truth": 0}, {"key": "24493400", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7826624902675208, "ground_truth": 0}, {"key": "24493400", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.717011881057352, "ground_truth": 0}, {"key": "24493400", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493163406494, "ground_truth": 0}, {"key": "37791071", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8558511390916785, "ground_truth": 0}, {"key": "37791071", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8816149154924671, "ground_truth": 0}, {"key": "37791071", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9099070185958557, "ground_truth": 0}, {"key": "37791071", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743782682877, "ground_truth": 0}, {"key": "37791071", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511455845333, "ground_truth": 0}, {"key": "33528627", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8783142584943219, "ground_truth": 0}, {"key": "33528627", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8187367846968948, "ground_truth": 0}, {"key": "33528627", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8832359919576767, "ground_truth": 0}, {"key": "33528627", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163810677041, "ground_truth": 0}, {"key": "33528627", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748600716006, "ground_truth": 0}, {"key": "39925662", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9511422247879976, "ground_truth": 0}, {"key": "39925662", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9518632287005705, "ground_truth": 0}, {"key": "39925662", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.856812304538902, "ground_truth": 0}, {"key": "39925662", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367830499649, "ground_truth": 0}, {"key": "39925662", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.919063297360159, "ground_truth": 0}, {"key": "29213416", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.753466658680124, "ground_truth": 0}, {"key": "29213416", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8519528080573118, "ground_truth": 0}, {"key": "29213416", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7233094904109393, "ground_truth": 0}, {"key": "29213416", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149743607667, "ground_truth": 0}, {"key": "29213416", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884524739681, "ground_truth": 0}, {"key": "34492745", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.4474602827905276, "ground_truth": 0}, {"key": "34492745", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5350984274378127, "ground_truth": 0}, {"key": "34492745", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.48047869320976777, "ground_truth": 0}, {"key": "34492745", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074046880079436, "ground_truth": 0}, {"key": "34492745", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740225110699, "ground_truth": 0}, {"key": "34191937", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6601723781603617, "ground_truth": 0}, {"key": "34191937", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4921881259648764, "ground_truth": 0}, {"key": "34191937", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5292633875562954, "ground_truth": 0}, {"key": "34191937", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.709019135809092, "ground_truth": 0}, {"key": "34191937", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737425675908, "ground_truth": 0}, {"key": "34933372", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8548846425275712, "ground_truth": 0}, {"key": "34933372", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.850964711542176, "ground_truth": 0}, {"key": "34933372", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.877476794945374, "ground_truth": 0}, {"key": "34933372", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.884039285650484, "ground_truth": 0}, {"key": "34933372", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096215864469, "ground_truth": 0}, {"key": "38714379", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9458012711427506, "ground_truth": 0}, {"key": "38714379", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9130583369619474, "ground_truth": 0}, {"key": "38714379", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9559813519878247, "ground_truth": 0}, {"key": "38714379", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9441768582713568, "ground_truth": 0}, {"key": "38714379", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9734434285236616, "ground_truth": 0}, {"key": "39220660", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8998277891247489, "ground_truth": 0}, {"key": "39220660", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9324533137291866, "ground_truth": 0}, {"key": "39220660", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9381240137937814, "ground_truth": 0}, {"key": "39220660", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9469902279814374, "ground_truth": 0}, {"key": "39220660", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513674026567, "ground_truth": 0}, {"key": "41028780", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8116760067223473, "ground_truth": 0}, {"key": "41028780", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8140528226954238, "ground_truth": 0}, {"key": "41028780", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7476159422741047, "ground_truth": 0}, {"key": "41028780", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672120656243, "ground_truth": 0}, {"key": "41028780", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324891267156, "ground_truth": 0}, {"key": "39457108", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5679366219461275, "ground_truth": 0}, {"key": "39457108", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "39457108", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6671476677149563, "ground_truth": 0}, {"key": "39457108", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935196301227, "ground_truth": 0}, {"key": "39457108", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850131846194, "ground_truth": 0}, {"key": "38288018", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.727975437925465, "ground_truth": 0}, {"key": "38288018", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7279754442137903, "ground_truth": 0}, {"key": "38288018", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.665410550575983, "ground_truth": 0}, {"key": "38288018", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089098680883, "ground_truth": 0}, {"key": "38288018", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512737550372, "ground_truth": 0}, {"key": "40106293", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7325918370308513, "ground_truth": 0}, {"key": "40106293", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5926665975525552, "ground_truth": 0}, {"key": "40106293", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7233094775482626, "ground_truth": 0}, {"key": "40106293", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943708794886, "ground_truth": 0}, {"key": "40106293", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723771780145, "ground_truth": 0}, {"key": "39948797", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6825737393740348, "ground_truth": 0}, {"key": "39948797", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8210441157328833, "ground_truth": 0}, {"key": "39948797", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6424324900978182, "ground_truth": 0}, {"key": "39948797", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740138893605, "ground_truth": 0}, {"key": "39948797", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159540080713, "ground_truth": 0}, {"key": "31853399", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8596637485079235, "ground_truth": 0}, {"key": "31853399", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7592253963199379, "ground_truth": 0}, {"key": "31853399", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8596637500544478, "ground_truth": 0}, {"key": "31853399", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8879840457855595, "ground_truth": 0}, {"key": "31853399", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.877476791221799, "ground_truth": 0}, {"key": "35273252", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8116760310753701, "ground_truth": 0}, {"key": "35273252", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7892336962155472, "ground_truth": 0}, {"key": "35273252", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7341195242437475, "ground_truth": 0}, {"key": "35273252", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.781330603835778, "ground_truth": 0}, {"key": "35273252", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646174623823, "ground_truth": 0}, {"key": "37130459", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9532750433799776, "ground_truth": 0}, {"key": "37130459", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9873750505144002, "ground_truth": 0}, {"key": "37130459", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.948917262513784, "ground_truth": 0}, {"key": "37130459", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9600626882820675, "ground_truth": 0}, {"key": "37130459", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9702399043422857, "ground_truth": 0}, {"key": "21734003", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8267118100393712, "ground_truth": 0}, {"key": "21734003", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8289388065561342, "ground_truth": 0}, {"key": "21734003", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8289387929824149, "ground_truth": 0}, {"key": "21734003", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228261223649, "ground_truth": 0}, {"key": "21734003", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.740174363229133, "ground_truth": 0}, {"key": "33990737", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.73105856283047, "ground_truth": 0}, {"key": "33990737", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6774740051724121, "ground_truth": 0}, {"key": "33990737", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6495786167328593, "ground_truth": 0}, {"key": "33990737", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094703713159, "ground_truth": 0}, {"key": "33990737", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389974393029, "ground_truth": 0}, {"key": "34559912", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9073122191380588, "ground_truth": 0}, {"key": "34559912", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8322366599264021, "ground_truth": 0}, {"key": "34559912", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8187367792421041, "ground_truth": 0}, {"key": "34559912", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672250974916, "ground_truth": 0}, {"key": "34559912", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919976067157, "ground_truth": 0}, {"key": "39820439", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.552539679418365, "ground_truth": 0}, {"key": "39820439", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5660185308967334, "ground_truth": 0}, {"key": "39820439", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5621765084908381, "ground_truth": 0}, {"key": "39820439", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291022932868, "ground_truth": 0}, {"key": "39820439", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.583203350406239, "ground_truth": 0}, {"key": "34759328", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8175744743381895, "ground_truth": 0}, {"key": "34759328", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9489172593613716, "ground_truth": 0}, {"key": "34759328", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8848377774562793, "ground_truth": 0}, {"key": "34759328", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9246876947447649, "ground_truth": 0}, {"key": "34759328", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816148990487653, "ground_truth": 0}, {"key": "36939137", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.762070110652662, "ground_truth": 0}, {"key": "36939137", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8652240838166037, "ground_truth": 0}, {"key": "36939137", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8198933329464867, "ground_truth": 0}, {"key": "36939137", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063700818723, "ground_truth": 0}, {"key": "36939137", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835399305166, "ground_truth": 0}, {"key": "35851522", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8386797654451641, "ground_truth": 0}, {"key": "35851522", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7956581034967369, "ground_truth": 0}, {"key": "35851522", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6297745968705951, "ground_truth": 0}, {"key": "35851522", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300621393095, "ground_truth": 0}, {"key": "35851522", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754566173043, "ground_truth": 0}, {"key": "22412782", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7138307414545385, "ground_truth": 0}, {"key": "22412782", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7279754385162351, "ground_truth": 0}, {"key": "22412782", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7041601443966593, "ground_truth": 0}, {"key": "22412782", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666688350007, "ground_truth": 0}, {"key": "22412782", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046826352393, "ground_truth": 0}, {"key": "38579227", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9173026538217506, "ground_truth": 0}, {"key": "38579227", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.92683528104293, "ground_truth": 0}, {"key": "38579227", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9202179831970756, "ground_truth": 0}, {"key": "38579227", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9420819151603246, "ground_truth": 0}, {"key": "38579227", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765202578001, "ground_truth": 0}, {"key": "37206995", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9005297832966327, "ground_truth": 0}, {"key": "37206995", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8925625277955138, "ground_truth": 0}, {"key": "37206995", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8864204187024993, "ground_truth": 0}, {"key": "37206995", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9314625056786359, "ground_truth": 0}, {"key": "37206995", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036353597786, "ground_truth": 0}, {"key": "38700847", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9465966654431089, "ground_truth": 0}, {"key": "38700847", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9376689608807179, "ground_truth": 0}, {"key": "38700847", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9615338087058578, "ground_truth": 0}, {"key": "38700847", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9722043733261678, "ground_truth": 0}, {"key": "38700847", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9569571496112347, "ground_truth": 0}, {"key": "20246590", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9939024382641107, "ground_truth": 0}, {"key": "20246590", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9950945947791937, "ground_truth": 0}, {"key": "20246590", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9822877012525599, "ground_truth": 0}, {"key": "20246590", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9862576799233185, "ground_truth": 0}, {"key": "20246590", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9790357581261522, "ground_truth": 0}, {"key": "39141360", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7606506661025331, "ground_truth": 0}, {"key": "39141360", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6959583216394405, "ground_truth": 0}, {"key": "39141360", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.746138970043896, "ground_truth": 0}, {"key": "39141360", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306295222495, "ground_truth": 0}, {"key": "39141360", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545664698074, "ground_truth": 0}, {"key": "37906226", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6584174853538713, "ground_truth": 0}, {"key": "37906226", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6370307972434898, "ground_truth": 0}, {"key": "37906226", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.43590152450750796, "ground_truth": 0}, {"key": "37906226", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093569160777, "ground_truth": 0}, {"key": "37906226", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.560252647746277, "ground_truth": 0}, {"key": "16201033", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5621764995531134, "ground_truth": 0}, {"key": "16201033", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7549150073659938, "ground_truth": 0}, {"key": "16201033", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5774953774122571, "ground_truth": 0}, {"key": "16201033", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197856310979, "ground_truth": 0}, {"key": "16201033", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318249846325, "ground_truth": 0}, {"key": "36469022", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7185943983004199, "ground_truth": 0}, {"key": "36469022", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6909762640915635, "ground_truth": 0}, {"key": "36469022", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7648916076217891, "ground_truth": 0}, {"key": "36469022", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918411328431, "ground_truth": 0}, {"key": "36469022", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102424660494, "ground_truth": 0}, {"key": "31295270", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7371581417926297, "ground_truth": 0}, {"key": "31295270", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7295197970627413, "ground_truth": 0}, {"key": "31295270", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6132365673509094, "ground_truth": 0}, {"key": "31295270", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.801935829468273, "ground_truth": 0}, {"key": "31295270", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102515304553, "ground_truth": 0}, {"key": "35360689", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7606506484609645, "ground_truth": 0}, {"key": "35360689", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4092207875916167, "ground_truth": 0}, {"key": "35360689", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7090191208547353, "ground_truth": 0}, {"key": "35360689", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4649015577285632, "ground_truth": 0}, {"key": "35360689", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512554371604, "ground_truth": 0}, {"key": "29202793", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.771843500591784, "ground_truth": 0}, {"key": "29202793", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.769080229209355, "ground_truth": 0}, {"key": "29202793", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7853085879596677, "ground_truth": 0}, {"key": "29202793", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.828938807819425, "ground_truth": 0}, {"key": "29202793", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715139385736, "ground_truth": 0}, {"key": "35999008", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5370413601924456, "ground_truth": 0}, {"key": "35999008", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6297746080351297, "ground_truth": 0}, {"key": "35999008", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6206216172415705, "ground_truth": 0}, {"key": "35999008", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.43014738016340165, "ground_truth": 0}, {"key": "35999008", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582565698681, "ground_truth": 0}, {"key": "31797119", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8998277745783343, "ground_truth": 0}, {"key": "31797119", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8587185677178691, "ground_truth": 0}, {"key": "31797119", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8955226766946223, "ground_truth": 0}, {"key": "31797119", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9324533095704893, "ground_truth": 0}, {"key": "31797119", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513686306297, "ground_truth": 0}, {"key": "26711893", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7732163748754776, "ground_truth": 0}, {"key": "26711893", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6619228742270026, "ground_truth": 0}, {"key": "26711893", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8006919961012416, "ground_truth": 0}, {"key": "26711893", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199531070896, "ground_truth": 0}, {"key": "26711893", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269257096936, "ground_truth": 0}, {"key": "35348288", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5195213286367228, "ground_truth": 0}, {"key": "35348288", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6150878731562406, "ground_truth": 0}, {"key": "35348288", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.620621596647712, "ground_truth": 0}, {"key": "35348288", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216327536189, "ground_truth": 0}, {"key": "35348288", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990581800011, "ground_truth": 0}, {"key": "38124131", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6315942975230984, "ground_truth": 0}, {"key": "38124131", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6370308036456362, "ground_truth": 0}, {"key": "38124131", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7662936490506126, "ground_truth": 0}, {"key": "38124131", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833754128091, "ground_truth": 0}, {"key": "38124131", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956581026734866, "ground_truth": 0}, {"key": "20285901", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7759445543647617, "ground_truth": 0}, {"key": "20285901", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7310585665822429, "ground_truth": 0}, {"key": "20285901", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8438951007518539, "ground_truth": 0}, {"key": "20285901", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494748759948, "ground_truth": 0}, {"key": "20285901", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.740174351991896, "ground_truth": 0}, {"key": "35633632", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5717666008920786, "ground_truth": 0}, {"key": "35633632", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7461389854209954, "ground_truth": 0}, {"key": "35633632", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7461389993419419, "ground_truth": 0}, {"key": "35633632", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880155010749, "ground_truth": 0}, {"key": "35633632", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306270758305, "ground_truth": 0}, {"key": "10741274", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7341195362611457, "ground_truth": 0}, {"key": "10741274", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6876300083749813, "ground_truth": 0}, {"key": "10741274", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8255897310043888, "ground_truth": 0}, {"key": "10741274", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416739912057294, "ground_truth": 0}, {"key": "10741274", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241844653604, "ground_truth": 0}, {"key": "30605795", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6261241883665749, "ground_truth": 0}, {"key": "30605795", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7401743941234165, "ground_truth": 0}, {"key": "30605795", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7279754769354592, "ground_truth": 0}, {"key": "30605795", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797662534758, "ground_truth": 0}, {"key": "30605795", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.654894713182896, "ground_truth": 0}, {"key": "30539722", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6584175015166287, "ground_truth": 0}, {"key": "30539722", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6352224340895605, "ground_truth": 0}, {"key": "30539722", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5774953801726427, "ground_truth": 0}, {"key": "30539722", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575583936645, "ground_truth": 0}, {"key": "30539722", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432057125238, "ground_truth": 0}, {"key": "18639299", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7371581773359306, "ground_truth": 0}, {"key": "18639299", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6943026762313467, "ground_truth": 0}, {"key": "18639299", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7759445704874669, "ground_truth": 0}, {"key": "18639299", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833988014985, "ground_truth": 0}, {"key": "18639299", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210708444376, "ground_truth": 0}, {"key": "39773552", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9441768562428903, "ground_truth": 0}, {"key": "39773552", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9407897491646209, "ground_truth": 0}, {"key": "39773552", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9376689611156116, "ground_truth": 0}, {"key": "39773552", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9585377270924137, "ground_truth": 0}, {"key": "39773552", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9294404039103717, "ground_truth": 0}, {"key": "34086410", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.697608897638074, "ground_truth": 0}, {"key": "34086410", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.649578639175136, "ground_truth": 0}, {"key": "34086410", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5389831991643638, "ground_truth": 0}, {"key": "34086410", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926665964153275, "ground_truth": 0}, {"key": "34086410", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004333075091, "ground_truth": 0}, {"key": "35454652", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7461389969628772, "ground_truth": 0}, {"key": "35454652", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.819893341771403, "ground_truth": 0}, {"key": "35454652", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.637030802426364, "ground_truth": 0}, {"key": "35454652", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197970194277, "ground_truth": 0}, {"key": "35454652", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321875084907, "ground_truth": 0}, {"key": "36158310", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9073122149830517, "ground_truth": 0}, {"key": "36158310", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7106282922107662, "ground_truth": 0}, {"key": "36158310", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8976952992402055, "ground_truth": 0}, {"key": "36158310", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637533918129, "ground_truth": 0}, {"key": "36158310", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274202949357, "ground_truth": 0}, {"key": "35688387", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6095241728549463, "ground_truth": 0}, {"key": "35688387", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.901920676163848, "ground_truth": 0}, {"key": "35688387", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7122321911409965, "ground_truth": 0}, {"key": "35688387", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548553280384, "ground_truth": 0}, {"key": "35688387", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358159765225, "ground_truth": 0}, {"key": "34209292", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7008947999760253, "ground_truth": 0}, {"key": "34209292", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6187804249477303, "ground_truth": 0}, {"key": "34209292", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6757646263591154, "ground_truth": 0}, {"key": "34209292", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786492977933152, "ground_truth": 0}, {"key": "34209292", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300739556338, "ground_truth": 0}, {"key": "25037859", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6095241424869494, "ground_truth": 0}, {"key": "25037859", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6001883660958873, "ground_truth": 0}, {"key": "25037859", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6095241648949971, "ground_truth": 0}, {"key": "25037859", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512216245388, "ground_truth": 0}, {"key": "25037859", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990811556614, "ground_truth": 0}, {"key": "36412121", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9437636546984096, "ground_truth": 0}, {"key": "36412121", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9252299606693694, "ground_truth": 0}, {"key": "36412121", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9507778848472878, "ground_truth": 0}, {"key": "36412121", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9473810444297044, "ground_truth": 0}, {"key": "36412121", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053222901971723, "ground_truth": 0}, {"key": "34909172", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7356416521935061, "ground_truth": 0}, {"key": "34909172", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6187804408502001, "ground_truth": 0}, {"key": "34909172", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7799929123102239, "ground_truth": 0}, {"key": "34909172", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336900435794, "ground_truth": 0}, {"key": "34909172", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666450248266, "ground_truth": 0}, {"key": "39011806", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9676556711966953, "ground_truth": 0}, {"key": "39011806", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9658995736656326, "ground_truth": 0}, {"key": "39011806", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9612438051951862, "ground_truth": 0}, {"key": "39011806", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.97220437573133, "ground_truth": 0}, {"key": "39011806", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9709092456777806, "ground_truth": 0}, {"key": "33096163", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835358606987, "ground_truth": 0}, {"key": "33096163", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8019358379010175, "ground_truth": 0}, {"key": "33096163", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.805632182466086, "ground_truth": 0}, {"key": "33096163", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253731280459, "ground_truth": 0}, {"key": "33096163", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506497719178, "ground_truth": 0}, {"key": "38762205", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9572778025839361, "ground_truth": 0}, {"key": "38762205", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9600626844826817, "ground_truth": 0}, {"key": "38762205", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9246877020120804, "ground_truth": 0}, {"key": "38762205", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9458012682175084, "ground_truth": 0}, {"key": "38762205", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9257686333244608, "ground_truth": 0}, {"key": "35519177", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9149009502880417, "ground_truth": 0}, {"key": "35519177", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8577681026054519, "ground_truth": 0}, {"key": "35519177", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9257686347909273, "ground_truth": 0}, {"key": "35519177", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9362850026064736, "ground_truth": 0}, {"key": "35519177", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9230391742129037, "ground_truth": 0}, {"key": "36192531", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8128673314487161, "ground_truth": 0}, {"key": "36192531", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6909762722307511, "ground_truth": 0}, {"key": "36192531", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6876300061765322, "ground_truth": 0}, {"key": "36192531", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737419818665, "ground_truth": 0}, {"key": "36192531", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879312047514065, "ground_truth": 0}, {"key": "33160852", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9780517465035168, "ground_truth": 0}, {"key": "33160852", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9597620573008162, "ground_truth": 0}, {"key": "33160852", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9416541618854268, "ground_truth": 0}, {"key": "33160852", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9795114453202913, "ground_truth": 0}, {"key": "33160852", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9706877671846141, "ground_truth": 0}, {"key": "36312304", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.575588021644439, "ground_truth": 0}, {"key": "36312304", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6495786272868508, "ground_truth": 0}, {"key": "36312304", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.759225415017394, "ground_truth": 0}, {"key": "36312304", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216061976184, "ground_truth": 0}, {"key": "36312304", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947526610126, "ground_truth": 0}, {"key": "33773343", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7662936577291656, "ground_truth": 0}, {"key": "33773343", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8044059233011072, "ground_truth": 0}, {"key": "33773343", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7577943506879274, "ground_truth": 0}, {"key": "33773343", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701048492587, "ground_truth": 0}, {"key": "33773343", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059602526725, "ground_truth": 0}, {"key": "34913320", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7401743579257583, "ground_truth": 0}, {"key": "34913320", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7879312017706649, "ground_truth": 0}, {"key": "34913320", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7264256066466971, "ground_truth": 0}, {"key": "34913320", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601496130399, "ground_truth": 0}, {"key": "34913320", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943803329313, "ground_truth": 0}, {"key": "33784155", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7943849679718321, "ground_truth": 0}, {"key": "33784155", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8128673180865373, "ground_truth": 0}, {"key": "33784155", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.798186778214579, "ground_truth": 0}, {"key": "33784155", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026594583503, "ground_truth": 0}, {"key": "33784155", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008948102253749, "ground_truth": 0}, {"key": "24085062", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9852713860131908, "ground_truth": 0}, {"key": "24085062", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9928231186437431, "ground_truth": 0}, {"key": "24085062", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9715639646499109, "ground_truth": 0}, {"key": "24085062", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.974042645267589, "ground_truth": 0}, {"key": "24085062", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9859363735863679, "ground_truth": 0}, {"key": "33893487", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6424324927468026, "ground_truth": 0}, {"key": "33893487", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4649015836234575, "ground_truth": 0}, {"key": "33893487", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5078118644935509, "ground_truth": 0}, {"key": "33893487", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279511871897222, "ground_truth": 0}, {"key": "33893487", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238353216608, "ground_truth": 0}, {"key": "40913011", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9543079674927716, "ground_truth": 0}, {"key": "40913011", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9241418167749558, "ground_truth": 0}, {"key": "40913011", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9399133484548594, "ground_truth": 0}, {"key": "40913011", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9489172630477993, "ground_truth": 0}, {"key": "40913011", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9481545300306802, "ground_truth": 0}, {"key": "29642545", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6370307953959335, "ground_truth": 0}, {"key": "29642545", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7401743673870357, "ground_truth": 0}, {"key": "29642545", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7401743601109005, "ground_truth": 0}, {"key": "29642545", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624629425838, "ground_truth": 0}, {"key": "29642545", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754282813611, "ground_truth": 0}, {"key": "35969159", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7786493102169159, "ground_truth": 0}, {"key": "35969159", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7620701023916683, "ground_truth": 0}, {"key": "35969159", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7931059593884445, "ground_truth": 0}, {"key": "35969159", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253531334001, "ground_truth": 0}, {"key": "35969159", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601269620951, "ground_truth": 0}, {"key": "37081669", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6334102552289367, "ground_truth": 0}, {"key": "37081669", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7853085905731504, "ground_truth": 0}, {"key": "37081669", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7549149726585082, "ground_truth": 0}, {"key": "37081669", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.766293656410676, "ground_truth": 0}, {"key": "37081669", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802134169669, "ground_truth": 0}, {"key": "40048022", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8577681044363085, "ground_truth": 0}, {"key": "40048022", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.800692013307032, "ground_truth": 0}, {"key": "40048022", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8397339844577699, "ground_truth": 0}, {"key": "40048022", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920026370068, "ground_truth": 0}, {"key": "40048022", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163517465024, "ground_truth": 0}, {"key": "32884004", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9005297774667923, "ground_truth": 0}, {"key": "32884004", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9407897468355554, "ground_truth": 0}, {"key": "32884004", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9111796968679666, "ground_truth": 0}, {"key": "32884004", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339593477461, "ground_truth": 0}, {"key": "32884004", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545463654369, "ground_truth": 0}, {"key": "39022490", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.854884630897392, "ground_truth": 0}, {"key": "39022490", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.846957839631574, "ground_truth": 0}, {"key": "39022490", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8652240837000356, "ground_truth": 0}, {"key": "39022490", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835314793961, "ground_truth": 0}, {"key": "39022490", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892337025532845, "ground_truth": 0}, {"key": "35159385", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8624675465318867, "ground_truth": 0}, {"key": "35159385", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7371581765669974, "ground_truth": 0}, {"key": "35159385", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8056321931758824, "ground_truth": 0}, {"key": "35159385", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835406853539, "ground_truth": 0}, {"key": "35159385", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085714596697, "ground_truth": 0}, {"key": "34363669", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5234203592378909, "ground_truth": 0}, {"key": "34363669", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5292633749053391, "ground_truth": 0}, {"key": "34363669", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7057849949684298, "ground_truth": 0}, {"key": "34363669", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880342591921, "ground_truth": 0}, {"key": "34363669", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216271020986, "ground_truth": 0}, {"key": "36119687", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9648551543218593, "ground_truth": 0}, {"key": "36119687", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9184802400042866, "ground_truth": 0}, {"key": "36119687", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9507778912056692, "ground_truth": 0}, {"key": "36119687", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9485372274782983, "ground_truth": 0}, {"key": "36119687", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9515039937818224, "ground_truth": 0}, {"key": "35217446", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7718434931993007, "ground_truth": 0}, {"key": "35217446", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6825737373733188, "ground_truth": 0}, {"key": "35217446", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.73105857345444, "ground_truth": 0}, {"key": "35217446", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142459301926, "ground_truth": 0}, {"key": "35217446", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106282732304059, "ground_truth": 0}, {"key": "39049331", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8624675453432886, "ground_truth": 0}, {"key": "39049331", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8879840559986555, "ground_truth": 0}, {"key": "39049331", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.798186771741833, "ground_truth": 0}, {"key": "39049331", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.82782814409465, "ground_truth": 0}, {"key": "39049331", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267118022317677, "ground_truth": 0}, {"key": "36472242", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8031737919318438, "ground_truth": 0}, {"key": "36472242", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8933094018276606, "ground_truth": 0}, {"key": "36472242", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.891054945852972, "ground_truth": 0}, {"key": "36472242", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578497616775, "ground_truth": 0}, {"key": "36472242", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357655232588, "ground_truth": 0}, {"key": "31854721", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8596637537204046, "ground_truth": 0}, {"key": "31854721", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7154240034569761, "ground_truth": 0}, {"key": "31854721", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7853085934207853, "ground_truth": 0}, {"key": "31854721", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074046997799134, "ground_truth": 0}, {"key": "31854721", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933309953627, "ground_truth": 0}, {"key": "18725849", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8832359883318068, "ground_truth": 0}, {"key": "18725849", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8128673171088833, "ground_truth": 0}, {"key": "18725849", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7325918044650256, "ground_truth": 0}, {"key": "18725849", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884625530598, "ground_truth": 0}, {"key": "18725849", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382055554952, "ground_truth": 0}, {"key": "36883179", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7106282978994958, "ground_truth": 0}, {"key": "36883179", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6370308009856577, "ground_truth": 0}, {"key": "36883179", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.4668455973137586, "ground_truth": 0}, {"key": "36883179", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238561529508, "ground_truth": 0}, {"key": "36883179", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486735151836335, "ground_truth": 0}, {"key": "34266359", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7154239941318247, "ground_truth": 0}, {"key": "34266359", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7577943821521411, "ground_truth": 0}, {"key": "34266359", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8376199525674494, "ground_truth": 0}, {"key": "34266359", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.731058584379137, "ground_truth": 0}, {"key": "34266359", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.752012573451555, "ground_truth": 0}, {"key": "31920289", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7170118937135109, "ground_truth": 0}, {"key": "31920289", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8187368058253119, "ground_truth": 0}, {"key": "31920289", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7956581124764109, "ground_truth": 0}, {"key": "31920289", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068881521342, "ground_truth": 0}, {"key": "31920289", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849690933253, "ground_truth": 0}, {"key": "36292997", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.823328388936523, "ground_truth": 0}, {"key": "36292997", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6876299936988987, "ground_truth": 0}, {"key": "36292997", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8615382072712798, "ground_truth": 0}, {"key": "36292997", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281662860627, "ground_truth": 0}, {"key": "36292997", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972620940301, "ground_truth": 0}, {"key": "30412533", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8910549578694436, "ground_truth": 0}, {"key": "30412533", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8128673233937084, "ground_truth": 0}, {"key": "30412533", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7994423303464534, "ground_truth": 0}, {"key": "30412533", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884617859313, "ground_truth": 0}, {"key": "30412533", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311867509228, "ground_truth": 0}, {"key": "40433191", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9449947113838948, "ground_truth": 0}, {"key": "40433191", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9059898281669537, "ground_truth": 0}, {"key": "40433191", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9167080782095091, "ground_truth": 0}, {"key": "40433191", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748639253925, "ground_truth": 0}, {"key": "40433191", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9079671443566708, "ground_truth": 0}, {"key": "34565591", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5945512782515152, "ground_truth": 0}, {"key": "34565591", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6315943189601938, "ground_truth": 0}, {"key": "34565591", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5602526427732119, "ground_truth": 0}, {"key": "34565591", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512003103325, "ground_truth": 0}, {"key": "34565591", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.36840568388829925, "ground_truth": 0}, {"key": "36062480", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9086178938126955, "ground_truth": 0}, {"key": "36062480", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9202179917908544, "ground_truth": 0}, {"key": "36062480", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9252299529114008, "ground_truth": 0}, {"key": "36062480", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9525741278485799, "ground_truth": 0}, {"key": "36062480", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9230391744697028, "ground_truth": 0}, {"key": "37276883", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8187367899492054, "ground_truth": 0}, {"key": "37276883", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8164063881795239, "ground_truth": 0}, {"key": "37276883", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8397339590130756, "ground_truth": 0}, {"key": "37276883", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976953005386429, "ground_truth": 0}, {"key": "37276883", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637586124698, "ground_truth": 0}, {"key": "38509260", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8255897429399582, "ground_truth": 0}, {"key": "38509260", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8449215396717485, "ground_truth": 0}, {"key": "38509260", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8807970723543453, "ground_truth": 0}, {"key": "38509260", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511537205807, "ground_truth": 0}, {"key": "38509260", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.894789467836907, "ground_truth": 0}, {"key": "37139607", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9706877695579187, "ground_truth": 0}, {"key": "37139607", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9492946379919115, "ground_truth": 0}, {"key": "37139607", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9643214446214609, "ground_truth": 0}, {"key": "37139607", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9674102580727098, "ground_truth": 0}, {"key": "37139607", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9549844645595128, "ground_truth": 0}, {"key": "37092824", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9569571486964719, "ground_truth": 0}, {"key": "37092824", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9500414747381027, "ground_truth": 0}, {"key": "37092824", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9661559631877037, "ground_truth": 0}, {"key": "37092824", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9588471128849596, "ground_truth": 0}, {"key": "37092824", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923268716355, "ground_truth": 0}, {"key": "32191802", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9284088053990686, "ground_truth": 0}, {"key": "32191802", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8840392798298262, "ground_truth": 0}, {"key": "32191802", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9059898210019366, "ground_truth": 0}, {"key": "32191802", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9324533077571109, "ground_truth": 0}, {"key": "32191802", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942139878082, "ground_truth": 0}, {"key": "39396038", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9343951597614342, "ground_truth": 0}, {"key": "39396038", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9449947154024079, "ground_truth": 0}, {"key": "39396038", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8895288432624383, "ground_truth": 0}, {"key": "39396038", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.923039166039061, "ground_truth": 0}, {"key": "39396038", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056322032562659, "ground_truth": 0}, {"key": "39076884", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7839884797630147, "ground_truth": 0}, {"key": "39076884", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8661325196524311, "ground_truth": 0}, {"key": "39076884", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7826624693980071, "ground_truth": 0}, {"key": "39076884", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677649663817, "ground_truth": 0}, {"key": "39076884", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624605912641, "ground_truth": 0}, {"key": "27763432", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.392336831392332, "ground_truth": 0}, {"key": "27763432", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.49609384087937997, "ground_truth": 0}, {"key": "27763432", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5389832136980708, "ground_truth": 0}, {"key": "27763432", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907610275439353, "ground_truth": 0}, {"key": "27763432", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.3923368640331235, "ground_truth": 0}, {"key": "37806929", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9669140224976315, "ground_truth": 0}, {"key": "37806929", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9600626820862255, "ground_truth": 0}, {"key": "37806929", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.961821723990437, "ground_truth": 0}, {"key": "37806929", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9637799434040035, "ground_truth": 0}, {"key": "37806929", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9669140230749862, "ground_truth": 0}, {"key": "32334186", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8344068835626629, "ground_truth": 0}, {"key": "32334186", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7310585683106243, "ground_truth": 0}, {"key": "32334186", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7981867783385937, "ground_truth": 0}, {"key": "32334186", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288298031345, "ground_truth": 0}, {"key": "32334186", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159458332359, "ground_truth": 0}, {"key": "36187324", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.849971179859257, "ground_truth": 0}, {"key": "36187324", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9092645130236469, "ground_truth": 0}, {"key": "36187324", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.84594243897786, "ground_truth": 0}, {"key": "36187324", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392849453887, "ground_truth": 0}, {"key": "36187324", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632813090165, "ground_truth": 0}, {"key": "35306009", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.976846587878049, "ground_truth": 0}, {"key": "35306009", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9643214477551479, "ground_truth": 0}, {"key": "35306009", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9715639661806968, "ground_truth": 0}, {"key": "35306009", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.97612916527652, "ground_truth": 0}, {"key": "35306009", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9730365042327904, "ground_truth": 0}, {"key": "39490050", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.4765796571080803, "ground_truth": 0}, {"key": "39490050", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6388352628189599, "ground_truth": 0}, {"key": "39490050", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6039318740046071, "ground_truth": 0}, {"key": "39490050", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.613236575626157, "ground_truth": 0}, {"key": "39490050", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755879985304148, "ground_truth": 0}, {"key": "38072149", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5214711439352245, "ground_truth": 0}, {"key": "38072149", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6909763009827888, "ground_truth": 0}, {"key": "38072149", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6926419866665194, "ground_truth": 0}, {"key": "38072149", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646253180273, "ground_truth": 0}, {"key": "38072149", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.640635865520291, "ground_truth": 0}, {"key": "35899689", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7826624875249572, "ground_truth": 0}, {"key": "35899689", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8459424280597845, "ground_truth": 0}, {"key": "35899689", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8519528072698461, "ground_truth": 0}, {"key": "35899689", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288427846016, "ground_truth": 0}, {"key": "35899689", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437771459964, "ground_truth": 0}, {"key": "27994518", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7122321889094833, "ground_truth": 0}, {"key": "27994518", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6876299910989204, "ground_truth": 0}, {"key": "27994518", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.808067203817495, "ground_truth": 0}, {"key": "27994518", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581579240809, "ground_truth": 0}, {"key": "27994518", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195310177818, "ground_truth": 0}, {"key": "10615479", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.674050461117248, "ground_truth": 0}, {"key": "10615479", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.611381952672601, "ground_truth": 0}, {"key": "10615479", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7813306276915191, "ground_truth": 0}, {"key": "10615479", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.740174350108763, "ground_truth": 0}, {"key": "10615479", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217431990513716, "ground_truth": 0}, {"key": "40186667", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7905303259270829, "ground_truth": 0}, {"key": "40186667", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6757646196205782, "ground_truth": 0}, {"key": "40186667", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8529354863338611, "ground_truth": 0}, {"key": "40186667", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122959987048, "ground_truth": 0}, {"key": "40186667", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441028024974, "ground_truth": 0}, {"key": "38622886", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7799928912141578, "ground_truth": 0}, {"key": "38622886", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6261241401637397, "ground_truth": 0}, {"key": "38622886", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.757794349546285, "ground_truth": 0}, {"key": "38622886", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920051012606, "ground_truth": 0}, {"key": "38622886", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.818736803847398, "ground_truth": 0}, {"key": "40686943", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7025300587660968, "ground_truth": 0}, {"key": "40686943", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8056321868848848, "ground_truth": 0}, {"key": "40686943", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7634837753338459, "ground_truth": 0}, {"key": "40686943", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389892964696, "ground_truth": 0}, {"key": "40686943", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493115317482, "ground_truth": 0}, {"key": "30604567", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9695556524859887, "ground_truth": 0}, {"key": "30604567", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9549844695770684, "ground_truth": 0}, {"key": "30604567", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9656413105674772, "ground_truth": 0}, {"key": "30604567", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9713473294552554, "ground_truth": 0}, {"key": "30604567", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9722043780582256, "ground_truth": 0}, {"key": "35440903", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835273913619, "ground_truth": 0}, {"key": "35440903", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7704647857346126, "ground_truth": 0}, {"key": "35440903", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8558511506991646, "ground_truth": 0}, {"key": "35440903", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388078491372, "ground_truth": 0}, {"key": "35440903", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346150176717, "ground_truth": 0}, {"key": "37219533", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6740504881091003, "ground_truth": 0}, {"key": "37219533", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7248702573995758, "ground_truth": 0}, {"key": "37219533", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5888891466149903, "ground_truth": 0}, {"key": "37219533", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548424784167, "ground_truth": 0}, {"key": "37219533", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.704160153865286, "ground_truth": 0}, {"key": "40178965", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.908617897011008, "ground_truth": 0}, {"key": "40178965", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.905989830307848, "ground_truth": 0}, {"key": "40178965", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8688267840177604, "ground_truth": 0}, {"key": "40178965", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9066531291375554, "ground_truth": 0}, {"key": "40178965", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9079671408536326, "ground_truth": 0}, {"key": "13750468", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9053222933103928, "ground_truth": 0}, {"key": "13750468", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9241418186901784, "ground_truth": 0}, {"key": "13750468", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8774767961981284, "ground_truth": 0}, {"key": "13750468", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9376689625260709, "ground_truth": 0}, {"key": "13750468", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9299510417888054, "ground_truth": 0}, {"key": "17754949", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.658417485789056, "ground_truth": 0}, {"key": "17754949", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5525396808823078, "ground_truth": 0}, {"key": "17754949", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7090191474934833, "ground_truth": 0}, {"key": "17754949", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241457581252, "ground_truth": 0}, {"key": "17754949", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943898264186, "ground_truth": 0}, {"key": "36675623", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9717790143476703, "ground_truth": 0}, {"key": "36675623", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9722043801999031, "ground_truth": 0}, {"key": "36675623", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9585377281196226, "ground_truth": 0}, {"key": "36675623", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9676556693629679, "ground_truth": 0}, {"key": "36675623", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9640516774399911, "ground_truth": 0}, {"key": "40035440", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9856076643037698, "ground_truth": 0}, {"key": "40035440", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.949669364596475, "ground_truth": 0}, {"key": "40035440", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9669140253764382, "ground_truth": 0}, {"key": "40035440", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9690910383710271, "ground_truth": 0}, {"key": "40035440", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.961821721449207, "ground_truth": 0}, {"key": "37685909", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6671476759530095, "ground_truth": 0}, {"key": "37685909", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6619228656933304, "ground_truth": 0}, {"key": "37685909", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8198933310993752, "ground_truth": 0}, {"key": "37685909", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740271429169, "ground_truth": 0}, {"key": "37685909", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964227907871, "ground_truth": 0}, {"key": "36938787", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8233284004533521, "ground_truth": 0}, {"key": "36938787", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9130583475462901, "ground_truth": 0}, {"key": "36938787", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9507778828700464, "ground_truth": 0}, {"key": "36938787", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142398498802, "ground_truth": 0}, {"key": "36938787", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.907967143726196, "ground_truth": 0}, {"key": "39398068", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6601723960085242, "ground_truth": 0}, {"key": "39398068", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6001883362369937, "ground_truth": 0}, {"key": "39398068", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7634837570427465, "ground_truth": 0}, {"key": "39398068", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983122024000742, "ground_truth": 0}, {"key": "39398068", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159484329234, "ground_truth": 0}, {"key": "39926408", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7943849604858341, "ground_truth": 0}, {"key": "39926408", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7690802359838528, "ground_truth": 0}, {"key": "39926408", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6548947178302287, "ground_truth": 0}, {"key": "39926408", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.760650661755828, "ground_truth": 0}, {"key": "39926408", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321851887505, "ground_truth": 0}, {"key": "40465336", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9196425312587544, "ground_truth": 0}, {"key": "40465336", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9353465145966732, "ground_truth": 0}, {"key": "40465336", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.929951040071337, "ground_truth": 0}, {"key": "40465336", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9309620698721932, "ground_truth": 0}, {"key": "40465336", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372107927458365, "ground_truth": 0}, {"key": "34173549", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.93343080984435, "ground_truth": 0}, {"key": "34173549", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9241418206489239, "ground_truth": 0}, {"key": "34173549", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9246876918640546, "ground_truth": 0}, {"key": "34173549", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9304582575721779, "ground_truth": 0}, {"key": "34173549", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9556514196623539, "ground_truth": 0}, {"key": "33541535", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6825737591922347, "ground_truth": 0}, {"key": "33541535", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7416740170515587, "ground_truth": 0}, {"key": "33541535", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6992544223111067, "ground_truth": 0}, {"key": "33541535", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494547634933, "ground_truth": 0}, {"key": "33541535", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085903368792, "ground_truth": 0}, {"key": "35685195", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8006920094895781, "ground_truth": 0}, {"key": "35685195", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6740504829636277, "ground_truth": 0}, {"key": "35685195", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8056321808149637, "ground_truth": 0}, {"key": "35685195", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085804932812, "ground_truth": 0}, {"key": "35685195", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289387901698447, "ground_truth": 0}, {"key": "28440730", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5813030861538476, "ground_truth": 0}, {"key": "28440730", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6584174858683357, "ground_truth": 0}, {"key": "28440730", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7090191512909516, "ground_truth": 0}, {"key": "28440730", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020616104126002, "ground_truth": 0}, {"key": "28440730", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891160574599, "ground_truth": 0}, {"key": "38338714", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9740426440108744, "ground_truth": 0}, {"key": "38338714", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9603611586338726, "ground_truth": 0}, {"key": "38338714", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9702399054473241, "ground_truth": 0}, {"key": "38338714", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9658995707184753, "ground_truth": 0}, {"key": "38338714", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9738443795124726, "ground_truth": 0}, {"key": "32191881", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9079671360392124, "ground_truth": 0}, {"key": "32191881", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7905303309418344, "ground_truth": 0}, {"key": "32191881", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8714748664164479, "ground_truth": 0}, {"key": "32191881", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228256176436, "ground_truth": 0}, {"key": "32191881", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122974739185, "ground_truth": 0}, {"key": "37707251", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8791467631888389, "ground_truth": 0}, {"key": "37707251", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9381240193438211, "ground_truth": 0}, {"key": "37707251", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8824278737795139, "ground_truth": 0}, {"key": "37707251", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677584945499, "ground_truth": 0}, {"key": "37707251", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8933093959170374, "ground_truth": 0}, {"key": "40172567", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7892337028549713, "ground_truth": 0}, {"key": "40172567", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5794004173187678, "ground_truth": 0}, {"key": "40172567", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5602526966249214, "ground_truth": 0}, {"key": "40172567", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191246463523, "ground_truth": 0}, {"key": "40172567", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593116139894, "ground_truth": 0}, {"key": "33113255", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7704647763929159, "ground_truth": 0}, {"key": "33113255", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.836554574975863, "ground_truth": 0}, {"key": "33113255", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8031737818222366, "ground_truth": 0}, {"key": "33113255", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.838679771768357, "ground_truth": 0}, {"key": "33113255", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366385251649, "ground_truth": 0}, {"key": "33022143", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7592254147335127, "ground_truth": 0}, {"key": "33022143", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6791787073210294, "ground_truth": 0}, {"key": "33022143", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.586996436626761, "ground_truth": 0}, {"key": "33022143", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544144512289, "ground_truth": 0}, {"key": "33022143", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.4785288475696312, "ground_truth": 0}, {"key": "32084473", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9539660976908191, "ground_truth": 0}, {"key": "32084473", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9511422265298831, "ground_truth": 0}, {"key": "32084473", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9485372340861931, "ground_truth": 0}, {"key": "32084473", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9515039972442708, "ground_truth": 0}, {"key": "32084473", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9324533059544888, "ground_truth": 0}, {"key": "40564245", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8128673151801361, "ground_truth": 0}, {"key": "40564245", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8879840386662016, "ground_truth": 0}, {"key": "40564245", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.741673997206249, "ground_truth": 0}, {"key": "40564245", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059550194641, "ground_truth": 0}, {"key": "40564245", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.833324590319351, "ground_truth": 0}, {"key": "31717213", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5907791923366434, "ground_truth": 0}, {"key": "31717213", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5869964009061129, "ground_truth": 0}, {"key": "31717213", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7476159444403763, "ground_truth": 0}, {"key": "31717213", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.756357568399023, "ground_truth": 0}, {"key": "31717213", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592254018403787, "ground_truth": 0}, {"key": "34861894", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7813306270980891, "ground_truth": 0}, {"key": "34861894", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7476159646901203, "ground_truth": 0}, {"key": "34861894", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7476159443866495, "ground_truth": 0}, {"key": "34861894", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920102631547, "ground_truth": 0}, {"key": "34861894", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461390105646474, "ground_truth": 0}, {"key": "40838760", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9362849973425944, "ground_truth": 0}, {"key": "40838760", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8856314781275056, "ground_truth": 0}, {"key": "40838760", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8577681055596715, "ground_truth": 0}, {"key": "40838760", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339661886143, "ground_truth": 0}, {"key": "40838760", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923154585577, "ground_truth": 0}, {"key": "40044849", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9219218290584951, "ground_truth": 0}, {"key": "40044849", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9032942015244462, "ground_truth": 0}, {"key": "40044849", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9178933718393856, "ground_truth": 0}, {"key": "40044849", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.881614897017622, "ground_truth": 0}, {"key": "40044849", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8688267913577683, "ground_truth": 0}, {"key": "30296116", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7090191432637335, "ground_truth": 0}, {"key": "30296116", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8031738052469314, "ground_truth": 0}, {"key": "30296116", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7994423258736826, "ground_truth": 0}, {"key": "30296116", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762910930596, "ground_truth": 0}, {"key": "30296116", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956581080108195, "ground_truth": 0}, {"key": "34931360", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7264256193164026, "ground_truth": 0}, {"key": "34931360", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8311430597837993, "ground_truth": 0}, {"key": "34931360", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6992544178006238, "ground_truth": 0}, {"key": "34931360", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445677442177, "ground_truth": 0}, {"key": "34931360", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581688593111, "ground_truth": 0}, {"key": "18862422", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6671476828998666, "ground_truth": 0}, {"key": "18862422", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7201715167423495, "ground_truth": 0}, {"key": "18862422", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7295197792283944, "ground_truth": 0}, {"key": "18862422", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759833605818, "ground_truth": 0}, {"key": "18862422", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.763483756247725, "ground_truth": 0}, {"key": "36361140", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9462003549073309, "ground_truth": 0}, {"key": "36361140", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9178933667571322, "ground_truth": 0}, {"key": "36361140", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9492946377792802, "ground_truth": 0}, {"key": "36361140", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9640516769326604, "ground_truth": 0}, {"key": "36361140", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9458012722692973, "ground_truth": 0}, {"key": "39703329", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6601723760767775, "ground_truth": 0}, {"key": "39703329", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7476159471196975, "ground_truth": 0}, {"key": "39703329", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6601723412840249, "ground_truth": 0}, {"key": "39703329", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030770210184, "ground_truth": 0}, {"key": "39703329", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878658372199, "ground_truth": 0}, {"key": "34033324", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9394706074369044, "ground_truth": 0}, {"key": "34033324", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9178933695393138, "ground_truth": 0}, {"key": "34033324", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8976952912428326, "ground_truth": 0}, {"key": "34033324", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9588471169612733, "ground_truth": 0}, {"key": "34033324", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.940353060955078, "ground_truth": 0}, {"key": "35658862", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9066531199105129, "ground_truth": 0}, {"key": "35658862", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9196425332253032, "ground_truth": 0}, {"key": "35658862", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9046505367451694, "ground_truth": 0}, {"key": "35658862", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445353372222, "ground_truth": 0}, {"key": "35658862", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059098941381, "ground_truth": 0}, {"key": "36092657", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9219218310017808, "ground_truth": 0}, {"key": "36092657", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9273632977987063, "ground_truth": 0}, {"key": "36092657", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9433475727922762, "ground_truth": 0}, {"key": "36092657", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9092645133349458, "ground_truth": 0}, {"key": "36092657", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357558612161, "ground_truth": 0}, {"key": "26333438", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6584174974542011, "ground_truth": 0}, {"key": "26333438", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5717665846476442, "ground_truth": 0}, {"key": "26333438", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7520125687848548, "ground_truth": 0}, {"key": "26333438", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4687906220225403, "ground_truth": 0}, {"key": "26333438", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736783927483523, "ground_truth": 0}, {"key": "34184963", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5486734852791655, "ground_truth": 0}, {"key": "34184963", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5983121878705664, "ground_truth": 0}, {"key": "34184963", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5813030570182031, "ground_truth": 0}, {"key": "34184963", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5525396965876701, "ground_truth": 0}, {"key": "34184963", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746047354092, "ground_truth": 0}, {"key": "35069975", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6442250873281454, "ground_truth": 0}, {"key": "35069975", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6601724103489326, "ground_truth": 0}, {"key": "35069975", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8872045895640187, "ground_truth": 0}, {"key": "35069975", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366255442787, "ground_truth": 0}, {"key": "35069975", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746020714907, "ground_truth": 0}, {"key": "36443950", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5253688265297873, "ground_truth": 0}, {"key": "36443950", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5312093856436793, "ground_truth": 0}, {"key": "36443950", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5926666041914993, "ground_truth": 0}, {"key": "36443950", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224502069277, "ground_truth": 0}, {"key": "36443950", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.575587991474488, "ground_truth": 0}, {"key": "29460858", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7563575457037386, "ground_truth": 0}, {"key": "29460858", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7074047066708331, "ground_truth": 0}, {"key": "29460858", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7431680142622242, "ground_truth": 0}, {"key": "29460858", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437771998846, "ground_truth": 0}, {"key": "29460858", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228369748617, "ground_truth": 0}, {"key": "36155704", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6370308162867047, "ground_truth": 0}, {"key": "36155704", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.70416014850549, "ground_truth": 0}, {"key": "36155704", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7122322042138316, "ground_truth": 0}, {"key": "36155704", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011452069762, "ground_truth": 0}, {"key": "36155704", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754691172008, "ground_truth": 0}, {"key": "37185211", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9059898134725272, "ground_truth": 0}, {"key": "37185211", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8879840460881113, "ground_truth": 0}, {"key": "37185211", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9381240202631055, "ground_truth": 0}, {"key": "37185211", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8879840462074209, "ground_truth": 0}, {"key": "37185211", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9124361690494303, "ground_truth": 0}, {"key": "36454885", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7786493150598625, "ground_truth": 0}, {"key": "36454885", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624620870484, "ground_truth": 0}, {"key": "36454885", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6460137004052003, "ground_truth": 0}, {"key": "36454885", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159576844151, "ground_truth": 0}, {"key": "36454885", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253695494329, "ground_truth": 0}, {"key": "33148906", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6909762887986473, "ground_truth": 0}, {"key": "33148906", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6808786139743885, "ground_truth": 0}, {"key": "33148906", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7090191327021605, "ground_truth": 0}, {"key": "33148906", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819870666677, "ground_truth": 0}, {"key": "33148906", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759737253319, "ground_truth": 0}, {"key": "18086604", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5964331583172645, "ground_truth": 0}, {"key": "18086604", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7090191378807775, "ground_truth": 0}, {"key": "18086604", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5389832104795309, "ground_truth": 0}, {"key": "18086604", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584175081064076, "ground_truth": 0}, {"key": "18086604", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.48828340119069435, "ground_truth": 0}, {"key": "33693397", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8233283820982588, "ground_truth": 0}, {"key": "33693397", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7813306547727304, "ground_truth": 0}, {"key": "33693397", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7505527426150387, "ground_truth": 0}, {"key": "33693397", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059349236341, "ground_truth": 0}, {"key": "33693397", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918416284791, "ground_truth": 0}, {"key": "39501530", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5544704705120562, "ground_truth": 0}, {"key": "39501530", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5888891073011787, "ground_truth": 0}, {"key": "39501530", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7057850322542175, "ground_truth": 0}, {"key": "39501530", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593382594142, "ground_truth": 0}, {"key": "39501530", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566583124282818, "ground_truth": 0}, {"key": "30948874", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9241418182844151, "ground_truth": 0}, {"key": "30948874", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8031738020570528, "ground_truth": 0}, {"key": "30948874", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8998277752605179, "ground_truth": 0}, {"key": "30948874", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9429285992490128, "ground_truth": 0}, {"key": "30948874", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9319595809484803, "ground_truth": 0}, {"key": "39410675", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9241418216623811, "ground_truth": 0}, {"key": "39410675", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8116760276753157, "ground_truth": 0}, {"key": "39410675", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7943849641272589, "ground_truth": 0}, {"key": "39410675", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8955226721282669, "ground_truth": 0}, {"key": "39410675", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063813002744, "ground_truth": 0}, {"key": "32903337", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.42632158315471913, "ground_truth": 0}, {"key": "32903337", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.4649015338610398, "ground_truth": 0}, {"key": "32903337", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5660185224746123, "ground_truth": 0}, {"key": "32903337", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315943326245421, "ground_truth": 0}, {"key": "32903337", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.577495358396657, "ground_truth": 0}, {"key": "27685132", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7490872023303484, "ground_truth": 0}, {"key": "27685132", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7074046948249413, "ground_truth": 0}, {"key": "27685132", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8092759793118977, "ground_truth": 0}, {"key": "27685132", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582649199832, "ground_truth": 0}, {"key": "27685132", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679365672903081, "ground_truth": 0}, {"key": "22791471", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8397339508815508, "ground_truth": 0}, {"key": "22791471", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7772998706526445, "ground_truth": 0}, {"key": "22791471", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8479677556498256, "ground_truth": 0}, {"key": "22791471", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799929058028862, "ground_truth": 0}, {"key": "22791471", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526185880126, "ground_truth": 0}, {"key": "32292348", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7008948301496466, "ground_truth": 0}, {"key": "32292348", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7310585751170168, "ground_truth": 0}, {"key": "32292348", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7853085719405642, "ground_truth": 0}, {"key": "32292348", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563565422256, "ground_truth": 0}, {"key": "32292348", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419760387074, "ground_truth": 0}, {"key": "20482930", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.819893354667736, "ground_truth": 0}, {"key": "20482930", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7386690773527754, "ground_truth": 0}, {"key": "20482930", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7981867841704965, "ground_truth": 0}, {"key": "20482930", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680253551629, "ground_truth": 0}, {"key": "20482930", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867784655491, "ground_truth": 0}, {"key": "11635754", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7676898362301402, "ground_truth": 0}, {"key": "11635754", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7676898759032079, "ground_truth": 0}, {"key": "11635754", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.816406383759603, "ground_truth": 0}, {"key": "11635754", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.84796775802959, "ground_truth": 0}, {"key": "11635754", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094852282972, "ground_truth": 0}, {"key": "40029096", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6477982213609768, "ground_truth": 0}, {"key": "40029096", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6619228926228664, "ground_truth": 0}, {"key": "40029096", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8365545505038702, "ground_truth": 0}, {"key": "40029096", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217431937824978, "ground_truth": 0}, {"key": "40029096", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.656658254726695, "ground_truth": 0}, {"key": "40414719", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9196425288518362, "ground_truth": 0}, {"key": "40414719", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8723473837521033, "ground_truth": 0}, {"key": "40414719", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8910549527991888, "ground_truth": 0}, {"key": "40414719", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633915985495141, "ground_truth": 0}, {"key": "40414719", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869863419476, "ground_truth": 0}, {"key": "39537616", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8661325228861108, "ground_truth": 0}, {"key": "39537616", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9039745198081226, "ground_truth": 0}, {"key": "39537616", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8354835486103968, "ground_truth": 0}, {"key": "39537616", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506509006585, "ground_truth": 0}, {"key": "39537616", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680155228396, "ground_truth": 0}, {"key": "33245830", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7662936337891549, "ground_truth": 0}, {"key": "33245830", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8596637547788244, "ground_truth": 0}, {"key": "33245830", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7122322017814485, "ground_truth": 0}, {"key": "33245830", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299845861236, "ground_truth": 0}, {"key": "33245830", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.723309465687981, "ground_truth": 0}, {"key": "39243601", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8895288475354108, "ground_truth": 0}, {"key": "39243601", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8918110449496272, "ground_truth": 0}, {"key": "39243601", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8766343691933103, "ground_truth": 0}, {"key": "39243601", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204121488847, "ground_truth": 0}, {"key": "39243601", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9376689636050248, "ground_truth": 0}, {"key": "35815905", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7476159595019084, "ground_truth": 0}, {"key": "35815905", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7356416339331978, "ground_truth": 0}, {"key": "35815905", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.735641638340245, "ground_truth": 0}, {"key": "35815905", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307938947006, "ground_truth": 0}, {"key": "35815905", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105654754662, "ground_truth": 0}, {"key": "35260212", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8799743662519468, "ground_truth": 0}, {"key": "35260212", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8606036067808533, "ground_truth": 0}, {"key": "35260212", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8679338536649998, "ground_truth": 0}, {"key": "35260212", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.85776810787485, "ground_truth": 0}, {"key": "35260212", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104528377847, "ground_truth": 0}, {"key": "39193924", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6352224162236092, "ground_truth": 0}, {"key": "39193924", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7866228297083007, "ground_truth": 0}, {"key": "39193924", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7476159612063689, "ground_truth": 0}, {"key": "39193924", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878634364988, "ground_truth": 0}, {"key": "39193924", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.552539709356176, "ground_truth": 0}, {"key": "40658569", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7563575690669226, "ground_truth": 0}, {"key": "40658569", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6132365692683748, "ground_truth": 0}, {"key": "40658569", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7138307499515921, "ground_truth": 0}, {"key": "40658569", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.747615966795523, "ground_truth": 0}, {"key": "40658569", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849622651895, "ground_truth": 0}, {"key": "33497596", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7839884773962569, "ground_truth": 0}, {"key": "33497596", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8140528114017663, "ground_truth": 0}, {"key": "33497596", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7476159656205137, "ground_truth": 0}, {"key": "33497596", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195278999271, "ground_truth": 0}, {"key": "33497596", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.825589715945163, "ground_truth": 0}, {"key": "40339241", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8386797541633916, "ground_truth": 0}, {"key": "40339241", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7853085644635396, "ground_truth": 0}, {"key": "40339241", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6976089526165965, "ground_truth": 0}, {"key": "40339241", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680183405427, "ground_truth": 0}, {"key": "40339241", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647849690139, "ground_truth": 0}, {"key": "31792608", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8116760214237753, "ground_truth": 0}, {"key": "31792608", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8333245915361162, "ground_truth": 0}, {"key": "31792608", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8031737930138724, "ground_truth": 0}, {"key": "31792608", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047161048754, "ground_truth": 0}, {"key": "31792608", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149894531155, "ground_truth": 0}, {"key": "33132662", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8459424384327418, "ground_truth": 0}, {"key": "33132662", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8031737864649392, "ground_truth": 0}, {"key": "33132662", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7563575549933259, "ground_truth": 0}, {"key": "33132662", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802312239191, "ground_truth": 0}, {"key": "33132662", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195169387302, "ground_truth": 0}, {"key": "37577457", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.670608286478995, "ground_truth": 0}, {"key": "37577457", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.626124175313211, "ground_truth": 0}, {"key": "37577457", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6224593422594802, "ground_truth": 0}, {"key": "37577457", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.615087859398221, "ground_truth": 0}, {"key": "37577457", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878498082429, "ground_truth": 0}, {"key": "38701278", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9566342014756071, "ground_truth": 0}, {"key": "38701278", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9623913617725984, "ground_truth": 0}, {"key": "38701278", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9798226804448641, "ground_truth": 0}, {"key": "38701278", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9507778830105759, "ground_truth": 0}, {"key": "38701278", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9477691416423139, "ground_truth": 0}, {"key": "34570783", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.942928596324115, "ground_truth": 0}, {"key": "34570783", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9603611615254456, "ground_truth": 0}, {"key": "34570783", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9549844739578254, "ground_truth": 0}, {"key": "34570783", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037272068562, "ground_truth": 0}, {"key": "34570783", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9489172639785868, "ground_truth": 0}, {"key": "39064526", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7563575700127301, "ground_truth": 0}, {"key": "39064526", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7905303198640735, "ground_truth": 0}, {"key": "39064526", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7772998597923015, "ground_truth": 0}, {"key": "39064526", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526224279005, "ground_truth": 0}, {"key": "39064526", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601280233951, "ground_truth": 0}, {"key": "40741545", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8499711710402285, "ground_truth": 0}, {"key": "40741545", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8757869864584211, "ground_truth": 0}, {"key": "40741545", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8300437466322399, "ground_truth": 0}, {"key": "40741545", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438950995743919, "ground_truth": 0}, {"key": "40741545", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256021641781, "ground_truth": 0}, {"key": "36929751", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9778834097389809, "ground_truth": 0}, {"key": "36929751", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9681411451575176, "ground_truth": 0}, {"key": "36929751", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9681411457916357, "ground_truth": 0}, {"key": "36929751", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9773708001633556, "ground_truth": 0}, {"key": "36929751", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9785492707423386, "ground_truth": 0}, {"key": "23984730", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6169358206661536, "ground_truth": 0}, {"key": "23984730", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6406358636935676, "ground_truth": 0}, {"key": "23984730", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.554470448487344, "ground_truth": 0}, {"key": "23984730", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792102925492, "ground_truth": 0}, {"key": "23984730", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680065695307, "ground_truth": 0}, {"key": "36007415", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8955226791605667, "ground_truth": 0}, {"key": "36007415", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8774767896904438, "ground_truth": 0}, {"key": "36007415", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9111797067153413, "ground_truth": 0}, {"key": "36007415", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110374575602, "ground_truth": 0}, {"key": "36007415", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372107898381323, "ground_truth": 0}, {"key": "38875041", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8568122934830379, "ground_truth": 0}, {"key": "38875041", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9304582538004127, "ground_truth": 0}, {"key": "38875041", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8670357571987974, "ground_truth": 0}, {"key": "38875041", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8791467688188871, "ground_truth": 0}, {"key": "38875041", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517100562476, "ground_truth": 0}]