[{"key": "35232142", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.037326886738750634, "ground_truth": 0}, {"key": "35232142", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09877258952258156, "ground_truth": 0}, {"key": "35232142", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03919512972838465, "ground_truth": 0}, {"key": "35232142", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.051462762782267364, "ground_truth": 0}, {"key": "35232142", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.015663648978635224, "ground_truth": 0}, {"key": "40143035", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.060529387948744684, "ground_truth": 0}, {"key": "40143035", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.013532148311570163, "ground_truth": 0}, {"key": "40143035", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05399884155133228, "ground_truth": 0}, {"key": "40143035", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06142403930558163, "ground_truth": 0}, {"key": "40143035", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02120611864739245, "ground_truth": 0}, {"key": "35951548", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23934932918073648, "ground_truth": 0}, {"key": "35951548", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19498020858497797, "ground_truth": 0}, {"key": "35951548", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5370413730277129, "ground_truth": 0}, {"key": "35951548", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.35667071194059585, "ground_truth": 0}, {"key": "35951548", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.30652705848038553, "ground_truth": 0}, {"key": "36266422", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.030444350644425834, "ground_truth": 0}, {"key": "36266422", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.025371311609783856, "ground_truth": 0}, {"key": "36266422", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.012479699488635258, "ground_truth": 0}, {"key": "36266422", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01353214908359092, "ground_truth": 0}, {"key": "36266422", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.007907291932272398, "ground_truth": 0}, {"key": "38826984", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014281933442792013, "ground_truth": 0}, {"key": "38826984", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0038393946543764266, "ground_truth": 0}, {"key": "38826984", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0041662559512210375, "ground_truth": 0}, {"key": "38826984", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.010860331144653946, "ground_truth": 0}, {"key": "38826984", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.016529557157340117, "ground_truth": 0}, {"key": "34540833", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12592276490138138, "ground_truth": 0}, {"key": "34540833", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11047114646856912, "ground_truth": 0}, {"key": "34540833", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13028542679936006, "ground_truth": 0}, {"key": "34540833", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2869678767913951, "ground_truth": 0}, {"key": "34540833", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0926877780471695, "ground_truth": 0}, {"key": "20836172", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.010328153211074047, "ground_truth": 0}, {"key": "20836172", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07585818272187961, "ground_truth": 0}, {"key": "20836172", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21601151847968253, "ground_truth": 0}, {"key": "20836172", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04401865406875329, "ground_truth": 0}, {"key": "20836172", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0550052850558736, "ground_truth": 0}, {"key": "35932467", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01717670856654831, "ground_truth": 0}, {"key": "35932467", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08093670645615603, "ground_truth": 0}, {"key": "35932467", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04304284946233905, "ground_truth": 0}, {"key": "35932467", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01717670935337754, "ground_truth": 0}, {"key": "35932467", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07107367176675067, "ground_truth": 0}, {"key": "40758845", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.43782351054435925, "ground_truth": 0}, {"key": "40758845", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.217337517514186, "ground_truth": 0}, {"key": "40758845", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.27669053203352795, "ground_truth": 0}, {"key": "40758845", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181322409473243, "ground_truth": 0}, {"key": "40758845", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3684057112178262, "ground_truth": 0}, {"key": "30358490", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09041372625130827, "ground_truth": 0}, {"key": "30358490", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03663136855827744, "ground_truth": 0}, {"key": "30358490", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.029201291094657245, "ground_truth": 0}, {"key": "30358490", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06560483436847629, "ground_truth": 0}, {"key": "30358490", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.045862665001263875, "ground_truth": 0}, {"key": "34615665", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.28937168866589463, "ground_truth": 0}, {"key": "34615665", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2798284979092653, "ground_truth": 0}, {"key": "34615665", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08093671307763353, "ground_truth": 0}, {"key": "34615665", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2925953190305847, "ground_truth": 0}, {"key": "34615665", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1338674900006356, "ground_truth": 0}, {"key": "35890902", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.224055463742082, "ground_truth": 0}, {"key": "35890902", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04518375341234622, "ground_truth": 0}, {"key": "35890902", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1688569586144883, "ground_truth": 0}, {"key": "35890902", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223189136001216, "ground_truth": 0}, {"key": "35890902", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18242553283487284, "ground_truth": 0}, {"key": "37922330", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02527490122243889, "ground_truth": 0}, {"key": "37922330", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.011463797684804922, "ground_truth": 0}, {"key": "37922330", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01665704002766975, "ground_truth": 0}, {"key": "37922330", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.027901378806890368, "ground_truth": 0}, {"key": "37922330", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05986641929252843, "ground_truth": 0}, {"key": "30844962", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05223085486775078, "ground_truth": 0}, {"key": "30844962", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.053799644803221, "ground_truth": 0}, {"key": "30844962", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01214717074150029, "ground_truth": 0}, {"key": "30844962", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08449275318563783, "ground_truth": 0}, {"key": "30844962", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.057071398016777214, "ground_truth": 0}, {"key": "36217333", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.007755536972118394, "ground_truth": 0}, {"key": "36217333", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02854415024389174, "ground_truth": 0}, {"key": "36217333", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.016785491487334783, "ground_truth": 0}, {"key": "36217333", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02769025892655435, "ground_truth": 0}, {"key": "36217333", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024516338906131144, "ground_truth": 0}, {"key": "30816523", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13028542001092047, "ground_truth": 0}, {"key": "30816523", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.025565213081894595, "ground_truth": 0}, {"key": "30816523", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.032836955781633245, "ground_truth": 0}, {"key": "30816523", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.023779985185876266, "ground_truth": 0}, {"key": "30816523", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03760863617384613, "ground_truth": 0}, {"key": "38900884", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09203285641604436, "ground_truth": 0}, {"key": "38900884", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03384403420332789, "ground_truth": 0}, {"key": "38900884", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04434858036419091, "ground_truth": 0}, {"key": "38900884", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.038610927485688756, "ground_truth": 0}, {"key": "38900884", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05419872859110519, "ground_truth": 0}, {"key": "13890581", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.055208689261194696, "ground_truth": 0}, {"key": "13890581", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04054073830652746, "ground_truth": 0}, {"key": "13890581", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03435868710447832, "ground_truth": 0}, {"key": "13890581", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.048496002740011694, "ground_truth": 0}, {"key": "13890581", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.040389065951083374, "ground_truth": 0}, {"key": "40194700", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12252322069297777, "ground_truth": 0}, {"key": "40194700", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11838510045430356, "ground_truth": 0}, {"key": "40194700", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0832919256034545, "ground_truth": 0}, {"key": "40194700", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091975431253398, "ground_truth": 0}, {"key": "40194700", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05770531774937538, "ground_truth": 0}, {"key": "37903647", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11920291947743551, "ground_truth": 0}, {"key": "37903647", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.126785169797754, "ground_truth": 0}, {"key": "37903647", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08632347773419143, "ground_truth": 0}, {"key": "37903647", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19072402353931103, "ground_truth": 0}, {"key": "37903647", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.045352579545908316, "ground_truth": 0}, {"key": "13291223", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11008787829766015, "ground_truth": 0}, {"key": "13291223", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10856642041236449, "ground_truth": 0}, {"key": "13291223", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03832197436664183, "ground_truth": 0}, {"key": "13291223", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07211219870551401, "ground_truth": 0}, {"key": "13291223", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06903792443557354, "ground_truth": 0}, {"key": "36052570", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.020804490453850993, "ground_truth": 0}, {"key": "36052570", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.022201228745653393, "ground_truth": 0}, {"key": "36052570", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.00595715430239483, "ground_truth": 0}, {"key": "36052570", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.007149101879858306, "ground_truth": 0}, {"key": "36052570", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.00926801253916337, "ground_truth": 0}, {"key": "34944735", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.488283401914867, "ground_truth": 0}, {"key": "34944735", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6388352841509571, "ground_truth": 0}, {"key": "34944735", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5039061468031868, "ground_truth": 0}, {"key": "34944735", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746181008639, "ground_truth": 0}, {"key": "34944735", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882833863731713, "ground_truth": 0}, {"key": "32159602", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08329192471559256, "ground_truth": 0}, {"key": "32159602", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1250653828930822, "ground_truth": 0}, {"key": "32159602", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08093670791758364, "ground_truth": 0}, {"key": "32159602", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05500528522838562, "ground_truth": 0}, {"key": "32159602", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22000709430738624, "ground_truth": 0}, {"key": "34988915", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07237402164845724, "ground_truth": 0}, {"key": "34988915", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06441765993947528, "ground_truth": 0}, {"key": "34988915", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10158945021366404, "ground_truth": 0}, {"key": "34988915", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09568693915793113, "ground_truth": 0}, {"key": "34988915", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13296424701686574, "ground_truth": 0}, {"key": "37889203", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06489011596766128, "ground_truth": 0}, {"key": "37889203", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05942821848898168, "ground_truth": 0}, {"key": "37889203", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11676400728947971, "ground_truth": 0}, {"key": "37889203", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06903792789970599, "ground_truth": 0}, {"key": "37889203", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11240508048419094, "ground_truth": 0}, {"key": "33609927", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12506539091705798, "ground_truth": 0}, {"key": "33609927", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1143685222347628, "ground_truth": 0}, {"key": "33609927", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16132023499304304, "ground_truth": 0}, {"key": "33609927", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2094696961314585, "ground_truth": 0}, {"key": "33609927", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13568954002916092, "ground_truth": 0}, {"key": "33578778", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12336561455183256, "ground_truth": 0}, {"key": "33578778", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21206879734472217, "ground_truth": 0}, {"key": "33578778", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09401018590525684, "ground_truth": 0}, {"key": "33578778", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13660840655229214, "ground_truth": 0}, {"key": "33578778", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0710736628250857, "ground_truth": 0}, {"key": "36888270", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23934933863935043, "ground_truth": 0}, {"key": "36888270", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06348236166422995, "ground_truth": 0}, {"key": "36888270", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4824291227241148, "ground_truth": 0}, {"key": "36888270", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.29583986894848385, "ground_truth": 0}, {"key": "36888270", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0821066264424208, "ground_truth": 0}, {"key": "36846007", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08419108279903854, "ground_truth": 0}, {"key": "36846007", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15713685296485727, "ground_truth": 0}, {"key": "36846007", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10194651506240046, "ground_truth": 0}, {"key": "36846007", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16132024075173315, "ground_truth": 0}, {"key": "36846007", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2240554574036616, "ground_truth": 0}, {"key": "31723471", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.41111085728435043, "ground_truth": 0}, {"key": "31723471", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16776335686270355, "ground_truth": 0}, {"key": "31723471", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10669060235017316, "ground_truth": 0}, {"key": "31723471", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.27512972703276967, "ground_truth": 0}, {"key": "31723471", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10970577382900527, "ground_truth": 0}, {"key": "15921828", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7490872044015604, "ground_truth": 0}, {"key": "15921828", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7074046814313577, "ground_truth": 0}, {"key": "15921828", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8749346209768001, "ground_truth": 0}, {"key": "15921828", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575501637579, "ground_truth": 0}, {"key": "15921828", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942139043619, "ground_truth": 0}, {"key": "39109408", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1801066622201663, "ground_truth": 0}, {"key": "39109408", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19930801116986377, "ground_truth": 0}, {"key": "39109408", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3259495207248563, "ground_truth": 0}, {"key": "39109408", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.30735802118342587, "ground_truth": 0}, {"key": "39109408", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1895211057985621, "ground_truth": 0}, {"key": "20936833", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07751765840826683, "ground_truth": 0}, {"key": "20936833", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04903962287301818, "ground_truth": 0}, {"key": "20936833", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06560483115866728, "ground_truth": 0}, {"key": "20936833", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10706346206979779, "ground_truth": 0}, {"key": "20936833", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07263671044316079, "ground_truth": 0}, {"key": "36832879", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1465752088608179, "ground_truth": 0}, {"key": "36832879", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.27202455592670444, "ground_truth": 0}, {"key": "36832879", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.27904197675461423, "ground_truth": 0}, {"key": "36832879", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.32594952439324953, "ground_truth": 0}, {"key": "36832879", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18832397414583604, "ground_truth": 0}, {"key": "14958201", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.38861801672131113, "ground_truth": 0}, {"key": "14958201", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10706346111972838, "ground_truth": 0}, {"key": "14958201", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21733752138284226, "ground_truth": 0}, {"key": "14958201", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2146914066336567, "ground_truth": 0}, {"key": "14958201", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5312093714519823, "ground_truth": 0}, {"key": "34352262", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09073548525462477, "ground_truth": 0}, {"key": "34352262", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10669060019351863, "ground_truth": 0}, {"key": "34352262", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03461883837663799, "ground_truth": 0}, {"key": "34352262", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07159120065744545, "ground_truth": 0}, {"key": "34352262", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.039937318532943564, "ground_truth": 0}, {"key": "39805395", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4843800773054013, "ground_truth": 0}, {"key": "39805395", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09807932711580707, "ground_truth": 0}, {"key": "39805395", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.579400403514883, "ground_truth": 0}, {"key": "39805395", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15405756228274348, "ground_truth": 0}, {"key": "39805395", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269743526358, "ground_truth": 0}, {"key": "34303109", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03161876613427398, "ground_truth": 0}, {"key": "34303109", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.021615331026242086, "ground_truth": 0}, {"key": "34303109", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07531230918849269, "ground_truth": 0}, {"key": "34303109", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11838510074197733, "ground_truth": 0}, {"key": "34303109", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09773431615858552, "ground_truth": 0}, {"key": "39939090", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11476478518265663, "ground_truth": 0}, {"key": "39939090", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05460060649995866, "ground_truth": 0}, {"key": "39939090", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08601588136475782, "ground_truth": 0}, {"key": "39939090", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11201595726442365, "ground_truth": 0}, {"key": "39939090", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03649376685320795, "ground_truth": 0}, {"key": "29347771", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4016878168361225, "ground_truth": 0}, {"key": "29347771", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5156199061163489, "ground_truth": 0}, {"key": "29347771", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3775406736593649, "ground_truth": 0}, {"key": "29347771", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.45132651298225657, "ground_truth": 0}, {"key": "29347771", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2173375194830487, "ground_truth": 0}, {"key": "36783415", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.33982764510404284, "ground_truth": 0}, {"key": "36783415", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2254166094853084, "ground_truth": 0}, {"key": "36783415", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.34246158868476473, "ground_truth": 0}, {"key": "36783415", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.30902371626328695, "ground_truth": 0}, {"key": "36783415", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16505407222026872, "ground_truth": 0}, {"key": "37935687", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08389038773703122, "ground_truth": 0}, {"key": "37935687", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15405756083103608, "ground_truth": 0}, {"key": "37935687", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1634454411763419, "ground_truth": 0}, {"key": "37935687", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13477591422061222, "ground_truth": 0}, {"key": "37935687", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09138210967872358, "ground_truth": 0}, {"key": "40260829", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14223188267963557, "ground_truth": 0}, {"key": "40260829", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3415824867344301, "ground_truth": 0}, {"key": "40260829", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2674081601271773, "ground_truth": 0}, {"key": "40260829", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1710611839836422, "ground_truth": 0}, {"key": "40260829", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24436301767466884, "ground_truth": 0}, {"key": "36478199", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.028870908951231747, "ground_truth": 0}, {"key": "36478199", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.057918084906889225, "ground_truth": 0}, {"key": "36478199", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0381782784347687, "ground_truth": 0}, {"key": "36478199", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05146276705404354, "ground_truth": 0}, {"key": "36478199", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03676946564621271, "ground_truth": 0}, {"key": "34541803", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.27825679249847063, "ground_truth": 0}, {"key": "34541803", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13206614578171907, "ground_truth": 0}, {"key": "34541803", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2107662997289951, "ground_truth": 0}, {"key": "34541803", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07949570278464761, "ground_truth": 0}, {"key": "34541803", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18772760133012228, "ground_truth": 0}, {"key": "35360841", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07696083748290469, "ground_truth": 0}, {"key": "35360841", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03138043179352431, "ground_truth": 0}, {"key": "35360841", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0775176579420896, "ground_truth": 0}, {"key": "35360841", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10521053824322919, "ground_truth": 0}, {"key": "35360841", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03732688937496384, "ground_truth": 0}, {"key": "35550407", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.43206338826291574, "ground_truth": 0}, {"key": "35550407", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.39420094393779065, "ground_truth": 0}, {"key": "35550407", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22678362684061928, "ground_truth": 0}, {"key": "35550407", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.28298811252359374, "ground_truth": 0}, {"key": "35550407", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3140505478389522, "ground_truth": 0}, {"key": "37561590", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07864238080152354, "ground_truth": 0}, {"key": "37561590", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04272219697765112, "ground_truth": 0}, {"key": "37561590", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07978201351737049, "ground_truth": 0}, {"key": "37561590", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07369626833361209, "ground_truth": 0}, {"key": "37561590", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.053799642488335825, "ground_truth": 0}, {"key": "39328843", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.033336823402081786, "ground_truth": 0}, {"key": "39328843", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11201595162886074, "ground_truth": 0}, {"key": "39328843", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22541660549396153, "ground_truth": 0}, {"key": "39328843", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20434190801546265, "ground_truth": 0}, {"key": "39328843", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.044680871652906955, "ground_truth": 0}, {"key": "35389665", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7826624894094026, "ground_truth": 0}, {"key": "35389665", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3311197376365279, "ground_truth": 0}, {"key": "35389665", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5506073476485139, "ground_truth": 0}, {"key": "35389665", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.33982761772923425, "ground_truth": 0}, {"key": "35389665", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832048512085, "ground_truth": 0}, {"key": "33080187", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08389038532632076, "ground_truth": 0}, {"key": "33080187", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05070536708683103, "ground_truth": 0}, {"key": "33080187", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08632348174318814, "ground_truth": 0}, {"key": "33080187", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09041372804694009, "ground_truth": 0}, {"key": "33080187", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09636510224700014, "ground_truth": 0}, {"key": "38636995", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3504213620057709, "ground_truth": 0}, {"key": "38636995", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18476751399462954, "ground_truth": 0}, {"key": "38636995", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.294214977556835, "ground_truth": 0}, {"key": "38636995", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.368405688358745, "ground_truth": 0}, {"key": "38636995", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4301473515251319, "ground_truth": 0}, {"key": "18536236", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06008664704212969, "ground_truth": 0}, {"key": "18536236", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.020177319853778557, "ground_truth": 0}, {"key": "18536236", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02136888778381226, "ground_truth": 0}, {"key": "18536236", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04369105580298696, "ground_truth": 0}, {"key": "18536236", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04434857912597075, "ground_truth": 0}, {"key": "36289151", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.009161026433601793, "ground_truth": 0}, {"key": "36289151", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.003664220166130116, "ground_truth": 0}, {"key": "36289151", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.023962024004830773, "ground_truth": 0}, {"key": "36289151", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.008348054190232518, "ground_truth": 0}, {"key": "36289151", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.004924510585987341, "ground_truth": 0}, {"key": "23017045", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13568954829222205, "ground_truth": 0}, {"key": "23017045", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4244120074272746, "ground_truth": 0}, {"key": "23017045", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3757064747107465, "ground_truth": 0}, {"key": "23017045", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510838962726988, "ground_truth": 0}, {"key": "23017045", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.37204879048464956, "ground_truth": 0}, {"key": "36418082", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.31912139323565175, "ground_truth": 0}, {"key": "36418082", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026759284019713142, "ground_truth": 0}, {"key": "36418082", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25534365640412554, "ground_truth": 0}, {"key": "36418082", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16559312594047257, "ground_truth": 0}, {"key": "36418082", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04304284868934131, "ground_truth": 0}, {"key": "34396551", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027480692196554215, "ground_truth": 0}, {"key": "34396551", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0424038284980659, "ground_truth": 0}, {"key": "34396551", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.039787809891915826, "ground_truth": 0}, {"key": "34396551", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.011869121483459017, "ground_truth": 0}, {"key": "34396551", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01652955668013543, "ground_truth": 0}, {"key": "39720944", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3611647069512758, "ground_truth": 0}, {"key": "39720944", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3056973204087936, "ground_truth": 0}, {"key": "39720944", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0984254234805798, "ground_truth": 0}, {"key": "39720944", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1943678331296772, "ground_truth": 0}, {"key": "39720944", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974732214880907, "ground_truth": 0}, {"key": "35884842", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02696350125415924, "ground_truth": 0}, {"key": "35884842", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.033716537542066105, "ground_truth": 0}, {"key": "35884842", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.052230857110639496, "ground_truth": 0}, {"key": "35884842", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04146227708260997, "ground_truth": 0}, {"key": "35884842", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.040845719587314235, "ground_truth": 0}, {"key": "35403375", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10743747194416439, "ground_truth": 0}, {"key": "35403375", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2030746249210797, "ground_truth": 0}, {"key": "35403375", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14903530454054612, "ground_truth": 0}, {"key": "35403375", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07949570433611754, "ground_truth": 0}, {"key": "35403375", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0742313696108052, "ground_truth": 0}, {"key": "26341324", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.044348581324550405, "ground_truth": 0}, {"key": "26341324", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08419107882079692, "ground_truth": 0}, {"key": "26341324", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11357959163017256, "ground_truth": 0}, {"key": "26341324", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08210663033255113, "ground_truth": 0}, {"key": "26341324", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11357959219526903, "ground_truth": 0}, {"key": "19212345", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22953521297686327, "ground_truth": 0}, {"key": "19212345", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.059646940055463026, "ground_truth": 0}, {"key": "19212345", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04977344841828043, "ground_truth": 0}, {"key": "19212345", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08509903965428048, "ground_truth": 0}, {"key": "19212345", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12210386349801562, "ground_truth": 0}, {"key": "30548367", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9437636516539784, "ground_truth": 0}, {"key": "30548367", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09203286296596908, "ground_truth": 0}, {"key": "30548367", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8962513748865066, "ground_truth": 0}, {"key": "30548367", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181322084517156, "ground_truth": 0}, {"key": "30548367", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121957881950863, "ground_truth": 0}, {"key": "37919402", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13028542881512684, "ground_truth": 0}, {"key": "37919402", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.059210252081368354, "ground_truth": 0}, {"key": "37919402", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07423136846063744, "ground_truth": 0}, {"key": "37919402", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05644402757531837, "ground_truth": 0}, {"key": "37919402", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16451645226389244, "ground_truth": 0}, {"key": "39995133", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.29583987320954763, "ground_truth": 0}, {"key": "39995133", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09235979319930096, "ground_truth": 0}, {"key": "39995133", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16885695191493802, "ground_truth": 0}, {"key": "39995133", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3208212916881556, "ground_truth": 0}, {"key": "39995133", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2643583717774521, "ground_truth": 0}, {"key": "40249088", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22678362072628977, "ground_truth": 0}, {"key": "40249088", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20817893425551837, "ground_truth": 0}, {"key": "40249088", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20434190548260767, "ground_truth": 0}, {"key": "40249088", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23370634213882527, "ground_truth": 0}, {"key": "40249088", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1812632101099262, "ground_truth": 0}, {"key": "40254388", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22815649809322927, "ground_truth": 0}, {"key": "40254388", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.049958521979100425, "ground_truth": 0}, {"key": "40254388", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1847675107292299, "ground_truth": 0}, {"key": "40254388", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13753246919843143, "ground_truth": 0}, {"key": "40254388", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1294027314439366, "ground_truth": 0}, {"key": "31995230", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07055959473928887, "ground_truth": 0}, {"key": "31995230", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.015603532607541593, "ground_truth": 0}, {"key": "31995230", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04940524564148451, "ground_truth": 0}, {"key": "31995230", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08819004422045022, "ground_truth": 0}, {"key": "31995230", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0697949226037622, "ground_truth": 0}, {"key": "38632129", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.304041679954157, "ground_truth": 0}, {"key": "38632129", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.26894142044035996, "ground_truth": 0}, {"key": "38632129", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5253688068980495, "ground_truth": 0}, {"key": "38632129", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2829881347805612, "ground_truth": 0}, {"key": "38632129", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3328523319551025, "ground_truth": 0}, {"key": "35720795", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2643583739625609, "ground_truth": 0}, {"key": "35720795", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.052618951008085654, "ground_truth": 0}, {"key": "35720795", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04958902444838777, "ground_truth": 0}, {"key": "35720795", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13660840013041206, "ground_truth": 0}, {"key": "35720795", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12252321778794813, "ground_truth": 0}, {"key": "23906759", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6442251176440379, "ground_truth": 0}, {"key": "23906759", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2094696907400449, "ground_truth": 0}, {"key": "23906759", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3319854525132451, "ground_truth": 0}, {"key": "23906759", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.35846532700788436, "ground_truth": 0}, {"key": "23906759", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2666436220387286, "ground_truth": 0}, {"key": "19410108", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.013689477548833122, "ground_truth": 0}, {"key": "19410108", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.044514424702083916, "ground_truth": 0}, {"key": "19410108", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05223085549201345, "ground_truth": 0}, {"key": "19410108", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.026759282063138635, "ground_truth": 0}, {"key": "19410108", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04637820747229184, "ground_truth": 0}, {"key": "30745137", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0503306307613831, "ground_truth": 0}, {"key": "30745137", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09138210784992573, "ground_truth": 0}, {"key": "30745137", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09877258569499839, "ground_truth": 0}, {"key": "30745137", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09009300206768266, "ground_truth": 0}, {"key": "30745137", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469141788530685, "ground_truth": 0}, {"key": "26553115", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15304216233607718, "ground_truth": 0}, {"key": "26553115", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1721718503978724, "ground_truth": 0}, {"key": "26553115", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23231016060205276, "ground_truth": 0}, {"key": "26553115", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.26133092590932055, "ground_truth": 0}, {"key": "26553115", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804786639110075, "ground_truth": 0}, {"key": "37872311", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1233656150078189, "ground_truth": 0}, {"key": "37872311", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03410042726025122, "ground_truth": 0}, {"key": "37872311", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14903530441524024, "ground_truth": 0}, {"key": "37872311", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1097057679265019, "ground_truth": 0}, {"key": "37872311", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17328821397622457, "ground_truth": 0}, {"key": "35553131", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1694058772493477, "ground_truth": 0}, {"key": "35553131", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05686155104814653, "ground_truth": 0}, {"key": "35553131", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0713319989515112, "ground_truth": 0}, {"key": "35553131", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07004895906979593, "ground_truth": 0}, {"key": "35553131", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12378868363933396, "ground_truth": 0}, {"key": "39038936", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07211219703599334, "ground_truth": 0}, {"key": "39038936", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1302854239586418, "ground_truth": 0}, {"key": "39038936", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03258974395806347, "ground_truth": 0}, {"key": "39038936", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05300977598363419, "ground_truth": 0}, {"key": "39038936", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2018132357587772, "ground_truth": 0}, {"key": "38735486", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7752646996653486, "ground_truth": 0}, {"key": "38735486", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.759225404038655, "ground_truth": 0}, {"key": "38735486", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8697145733136726, "ground_truth": 0}, {"key": "38735486", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759833361634, "ground_truth": 0}, {"key": "38735486", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637484451611, "ground_truth": 0}, {"key": "17087845", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.008813166977352451, "ground_truth": 0}, {"key": "17087845", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0058653381703324195, "ground_truth": 0}, {"key": "17087845", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.028007519217096776, "ground_truth": 0}, {"key": "17087845", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03032925927529304, "ground_truth": 0}, {"key": "17087845", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03308597635090762, "ground_truth": 0}, {"key": "37443011", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.00902028086833846, "ground_truth": 0}, {"key": "37443011", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.019197450610571917, "ground_truth": 0}, {"key": "37443011", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.017509556034148097, "ground_truth": 0}, {"key": "37443011", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04385456472454858, "ground_truth": 0}, {"key": "37443011", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02451633793437542, "ground_truth": 0}, {"key": "36855749", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07396337357397498, "ground_truth": 0}, {"key": "36855749", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01363683561517011, "ground_truth": 0}, {"key": "36855749", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.053601142769862595, "ground_truth": 0}, {"key": "36855749", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.016529557117382312, "ground_truth": 0}, {"key": "36855749", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.028007520983516093, "ground_truth": 0}, {"key": "35613141", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2991051941659636, "ground_truth": 0}, {"key": "35613141", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4167966494689612, "ground_truth": 0}, {"key": "35613141", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3638728877254683, "ground_truth": 0}, {"key": "35613141", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687309890315926, "ground_truth": 0}, {"key": "35613141", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12294380051256439, "ground_truth": 0}, {"key": "39088847", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1384617913324596, "ground_truth": 0}, {"key": "39088847", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09268777606978618, "ground_truth": 0}, {"key": "39088847", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.24508500130001462, "ground_truth": 0}, {"key": "39088847", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181323376768118, "ground_truth": 0}, {"key": "39088847", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3007455904807469, "ground_truth": 0}, {"key": "33197277", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13523208322303512, "ground_truth": 0}, {"key": "33197277", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09807932642043536, "ground_truth": 0}, {"key": "33197277", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07807816152452236, "ground_truth": 0}, {"key": "33197277", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.149035296292602, "ground_truth": 0}, {"key": "33197277", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08122775619534539, "ground_truth": 0}, {"key": "33815489", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.029647508538116082, "ground_truth": 0}, {"key": "33815489", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1602660391712287, "ground_truth": 0}, {"key": "33815489", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22953520697495366, "ground_truth": 0}, {"key": "33815489", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1789559012648924, "ground_truth": 0}, {"key": "33815489", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09602549767065022, "ground_truth": 0}, {"key": "35862754", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.21601153141922164, "ground_truth": 0}, {"key": "35862754", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1147647806642267, "ground_truth": 0}, {"key": "35862754", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10743747383917296, "ground_truth": 0}, {"key": "35862754", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10631886986395876, "ground_truth": 0}, {"key": "35862754", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10266401161111889, "ground_truth": 0}, {"key": "36080615", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06656919061138067, "ground_truth": 0}, {"key": "36080615", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12421300901258672, "ground_truth": 0}, {"key": "36080615", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08882028905647754, "ground_truth": 0}, {"key": "36080615", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1097057739328305, "ground_truth": 0}, {"key": "36080615", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09073548441361153, "ground_truth": 0}, {"key": "22822742", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05300977360214768, "ground_truth": 0}, {"key": "22822742", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13892843174134326, "ground_truth": 0}, {"key": "22822742", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1143685244826662, "ground_truth": 0}, {"key": "22822742", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08632347894898239, "ground_truth": 0}, {"key": "22822742", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04352814060008731, "ground_truth": 0}, {"key": "39747536", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4436004406696918, "ground_truth": 0}, {"key": "39747536", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21601154161883823, "ground_truth": 0}, {"key": "39747536", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4073334205990546, "ground_truth": 0}, {"key": "39747536", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4542300611882454, "ground_truth": 0}, {"key": "39747536", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.31658050839435536, "ground_truth": 0}, {"key": "34218396", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06278920791323765, "ground_truth": 0}, {"key": "34218396", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21076629801756455, "ground_truth": 0}, {"key": "34218396", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09739039782758348, "ground_truth": 0}, {"key": "34218396", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2735743912160888, "ground_truth": 0}, {"key": "34218396", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07004896131564245, "ground_truth": 0}, {"key": "39150388", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.022977371426496588, "ground_truth": 0}, {"key": "39150388", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1347759175624733, "ground_truth": 0}, {"key": "39150388", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.27669053098823204, "ground_truth": 0}, {"key": "39150388", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10970577249689552, "ground_truth": 0}, {"key": "39150388", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17217184789129428, "ground_truth": 0}, {"key": "28765782", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15921740924486014, "ground_truth": 0}, {"key": "28765782", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13432105198118635, "ground_truth": 0}, {"key": "28765782", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04401865298428117, "ground_truth": 0}, {"key": "28765782", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10411241107737211, "ground_truth": 0}, {"key": "28765782", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11516223690909651, "ground_truth": 0}, {"key": "35828022", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04369106037015023, "ground_truth": 0}, {"key": "35828022", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01478540731650266, "ground_truth": 0}, {"key": "35828022", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06142404170047367, "ground_truth": 0}, {"key": "35828022", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03371653755779368, "ground_truth": 0}, {"key": "35828022", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05281402572262167, "ground_truth": 0}, {"key": "27717735", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.028980629623912568, "ground_truth": 0}, {"key": "27717735", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08093671601838033, "ground_truth": 0}, {"key": "27717735", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02779562466436495, "ground_truth": 0}, {"key": "27717735", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06233103909066619, "ground_truth": 0}, {"key": "27717735", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0769608405286352, "ground_truth": 0}, {"key": "37977826", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.005934067223433099, "ground_truth": 0}, {"key": "37977826", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0018602985545448938, "ground_truth": 0}, {"key": "37977826", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.007968814508681105, "ground_truth": 0}, {"key": "37977826", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01120121317318306, "ground_truth": 0}, {"key": "37977826", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0073173976019393185, "ground_truth": 0}, {"key": "31768588", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18713268387466067, "ground_truth": 0}, {"key": "31768588", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.028436032739482982, "ground_truth": 0}, {"key": "31768588", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13206615317781695, "ground_truth": 0}, {"key": "31768588", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10484335663113171, "ground_truth": 0}, {"key": "31768588", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.040999027929994325, "ground_truth": 0}, {"key": "37183351", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.025371313363856455, "ground_truth": 0}, {"key": "37183351", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.062331039615601005, "ground_truth": 0}, {"key": "37183351", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.023065226481937918, "ground_truth": 0}, {"key": "37183351", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.014785407109278514, "ground_truth": 0}, {"key": "37183351", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01812472149240102, "ground_truth": 0}, {"key": "39622090", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13117322410025362, "ground_truth": 0}, {"key": "39622090", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1895210872925902, "ground_truth": 0}, {"key": "39622090", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16026603943463927, "ground_truth": 0}, {"key": "39622090", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.25683200407249074, "ground_truth": 0}, {"key": "39622090", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15002882147101254, "ground_truth": 0}, {"key": "39272756", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.021948256277574588, "ground_truth": 0}, {"key": "39272756", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03514484583787996, "ground_truth": 0}, {"key": "39272756", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05834583883638209, "ground_truth": 0}, {"key": "39272756", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.008577484971089747, "ground_truth": 0}, {"key": "39272756", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.017375664524780763, "ground_truth": 0}, {"key": "32138822", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24220564128857466, "ground_truth": 0}, {"key": "32138822", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04401865513299007, "ground_truth": 0}, {"key": "32138822", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09807932769257297, "ground_truth": 0}, {"key": "32138822", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07640767568021829, "ground_truth": 0}, {"key": "32138822", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.045522005721732484, "ground_truth": 0}, {"key": "31070114", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24364246754153615, "ground_truth": 0}, {"key": "31070114", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3208213055063745, "ground_truth": 0}, {"key": "31070114", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2643583641229343, "ground_truth": 0}, {"key": "31070114", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.25982562687492256, "ground_truth": 0}, {"key": "31070114", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16721867108262875, "ground_truth": 0}, {"key": "39652762", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04552200758267782, "ground_truth": 0}, {"key": "39652762", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05399884181526195, "ground_truth": 0}, {"key": "39652762", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04069295496274448, "ground_truth": 0}, {"key": "39652762", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009303948722223987, "ground_truth": 0}, {"key": "39652762", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.045692032045361916, "ground_truth": 0}, {"key": "33258866", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02998650602922531, "ground_truth": 0}, {"key": "33258866", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05500528530798781, "ground_truth": 0}, {"key": "33258866", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02655657383563711, "ground_truth": 0}, {"key": "33258866", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.007937993914110686, "ground_truth": 0}, {"key": "33258866", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012527933281822426, "ground_truth": 0}, {"key": "36962388", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.048496001180961965, "ground_truth": 0}, {"key": "36962388", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.008511302932797078, "ground_truth": 0}, {"key": "36962388", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3090237132835811, "ground_truth": 0}, {"key": "36962388", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06075190685408739, "ground_truth": 0}, {"key": "36962388", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20817893610454846, "ground_truth": 0}, {"key": "32282272", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06371499482914462, "ground_truth": 0}, {"key": "32282272", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.057918088317590655, "ground_truth": 0}, {"key": "32282272", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06325052895859914, "ground_truth": 0}, {"key": "32282272", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08035746490158385, "ground_truth": 0}, {"key": "32282272", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03622005724939646, "ground_truth": 0}, {"key": "36093072", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22815648959424933, "ground_truth": 0}, {"key": "36093072", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11920292541314122, "ground_truth": 0}, {"key": "36093072", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16776335072325807, "ground_truth": 0}, {"key": "36093072", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11797801591459949, "ground_truth": 0}, {"key": "36093072", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16344543310865917, "ground_truth": 0}, {"key": "38879972", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03296124458259683, "ground_truth": 0}, {"key": "38879972", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03846619421950986, "ground_truth": 0}, {"key": "38879972", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03832197354922904, "ground_truth": 0}, {"key": "38879972", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04434857813276407, "ground_truth": 0}, {"key": "38879972", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.031618767739626644, "ground_truth": 0}, {"key": "32106473", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.024330189492203048, "ground_truth": 0}, {"key": "32106473", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02010023557264181, "ground_truth": 0}, {"key": "32106473", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.019345104445933743, "ground_truth": 0}, {"key": "32106473", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08725224510432186, "ground_truth": 0}, {"key": "32106473", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05108273641784157, "ground_truth": 0}, {"key": "40415815", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1250653798970731, "ground_truth": 0}, {"key": "40415815", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13846179267942865, "ground_truth": 0}, {"key": "40415815", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.031738592092417785, "ground_truth": 0}, {"key": "40415815", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07613248380790315, "ground_truth": 0}, {"key": "40415815", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11516223581936134, "ground_truth": 0}, {"key": "34581918", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.023599296258414896, "ground_truth": 0}, {"key": "34581918", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06608537816203747, "ground_truth": 0}, {"key": "34581918", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09534945941516049, "ground_truth": 0}, {"key": "34581918", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04023794373220657, "ground_truth": 0}, {"key": "34581918", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.048857781478489626, "ground_truth": 0}, {"key": "33004157", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.021615332800887947, "ground_truth": 0}, {"key": "33004157", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02758528276398112, "ground_truth": 0}, {"key": "33004157", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01602914617965969, "ground_truth": 0}, {"key": "33004157", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05460060668549927, "ground_truth": 0}, {"key": "33004157", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03222229662813995, "ground_truth": 0}, {"key": "30334943", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09367800282735486, "ground_truth": 0}, {"key": "30334943", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02377998451577581, "ground_truth": 0}, {"key": "30334943", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.021044566444501107, "ground_truth": 0}, {"key": "30334943", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.007403014311498981, "ground_truth": 0}, {"key": "30334943", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0181247211816573, "ground_truth": 0}, {"key": "33280503", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13206615244321035, "ground_truth": 0}, {"key": "33280503", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3157359797613886, "ground_truth": 0}, {"key": "33280503", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14128140932893518, "ground_truth": 0}, {"key": "33280503", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19930800928089887, "ground_truth": 0}, {"key": "33280503", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08601587979997295, "ground_truth": 0}, {"key": "25726782", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027795624031744303, "ground_truth": 0}, {"key": "25726782", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.054399319481643976, "ground_truth": 0}, {"key": "25726782", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10017222020334685, "ground_truth": 0}, {"key": "25726782", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0866320632099644, "ground_truth": 0}, {"key": "25726782", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04240382614737928, "ground_truth": 0}, {"key": "35479854", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14903530582611632, "ground_truth": 0}, {"key": "35479854", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03397199949469881, "ground_truth": 0}, {"key": "35479854", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08479540425382896, "ground_truth": 0}, {"key": "35479854", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0761324815479411, "ground_truth": 0}, {"key": "35479854", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01665704021041689, "ground_truth": 0}, {"key": "32716226", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.051082738346037805, "ground_truth": 0}, {"key": "32716226", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14903529958050088, "ground_truth": 0}, {"key": "32716226", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.044680869071948306, "ground_truth": 0}, {"key": "32716226", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02194825538770488, "ground_truth": 0}, {"key": "32716226", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04501553095567167, "ground_truth": 0}, {"key": "37047554", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19806417252715564, "ground_truth": 0}, {"key": "37047554", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3684057176506134, "ground_truth": 0}, {"key": "37047554", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23651624070261226, "ground_truth": 0}, {"key": "37047554", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2309197456166762, "ground_truth": 0}, {"key": "37047554", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3486451386186864, "ground_truth": 0}, {"key": "36565290", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2465333532693228, "ground_truth": 0}, {"key": "36565290", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07369627327490215, "ground_truth": 0}, {"key": "36565290", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2011847316703968, "ground_truth": 0}, {"key": "36565290", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13296425146330662, "ground_truth": 0}, {"key": "36565290", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13660840075374728, "ground_truth": 0}, {"key": "27758640", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0844927567301197, "ground_truth": 0}, {"key": "27758640", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11397345711125627, "ground_truth": 0}, {"key": "27758640", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010735162703543553, "ground_truth": 0}, {"key": "27758640", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08240150757481848, "ground_truth": 0}, {"key": "27758640", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11436852652762192, "ground_truth": 0}, {"key": "28897118", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3293917066551106, "ground_truth": 0}, {"key": "28897118", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08151975128355872, "ground_truth": 0}, {"key": "28897118", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.39606818415452966, "ground_truth": 0}, {"key": "28897118", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19930800952053238, "ground_truth": 0}, {"key": "28897118", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291217859835, "ground_truth": 0}, {"key": "38452661", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7401743541470251, "ground_truth": 0}, {"key": "38452661", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.30902371127794803, "ground_truth": 0}, {"key": "38452661", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.33982763191951626, "ground_truth": 0}, {"key": "38452661", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16667539876215773, "ground_truth": 0}, {"key": "38452661", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13206615295612747, "ground_truth": 0}, {"key": "38033492", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0821066279163765, "ground_truth": 0}, {"key": "38033492", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05340333116923799, "ground_truth": 0}, {"key": "38033492", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12506538847021456, "ground_truth": 0}, {"key": "38033492", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06853749466939199, "ground_truth": 0}, {"key": "38033492", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11436852306917146, "ground_truth": 0}, {"key": "35949555", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.008348054179119749, "ground_truth": 0}, {"key": "35949555", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.003403005747088843, "ground_truth": 0}, {"key": "35949555", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.018124720312590718, "ground_truth": 0}, {"key": "35949555", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009303948873978103, "ground_truth": 0}, {"key": "35949555", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.026963501934859323, "ground_truth": 0}, {"key": "15263826", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2829881307485049, "ground_truth": 0}, {"key": "15263826", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09947020711755238, "ground_truth": 0}, {"key": "15263826", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.29583986767635784, "ground_truth": 0}, {"key": "15263826", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17781086844457378, "ground_truth": 0}, {"key": "15263826", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09807932471897673, "ground_truth": 0}, {"key": "37313866", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4921881339944799, "ground_truth": 0}, {"key": "37313866", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08449275151411753, "ground_truth": 0}, {"key": "37313866", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1500288289571727, "ground_truth": 0}, {"key": "37313866", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04689926402996319, "ground_truth": 0}, {"key": "37313866", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07531230622604805, "ground_truth": 0}, {"key": "13911157", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.32252598464416593, "ground_truth": 0}, {"key": "13911157", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14804719563404606, "ground_truth": 0}, {"key": "13911157", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11596071498419684, "ground_truth": 0}, {"key": "13911157", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1456006407293192, "ground_truth": 0}, {"key": "13911157", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13753247148407055, "ground_truth": 0}, {"key": "39594894", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04586266273599289, "ground_truth": 0}, {"key": "39594894", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3923368382899524, "ground_truth": 0}, {"key": "39594894", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06608537425864378, "ground_truth": 0}, {"key": "39594894", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10123348419258428, "ground_truth": 0}, {"key": "39594894", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1581743521516265, "ground_truth": 0}, {"key": "34096170", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10521053405396356, "ground_truth": 0}, {"key": "34096170", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.37937839205048657, "ground_truth": 0}, {"key": "34096170", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.35042136946960417, "ground_truth": 0}, {"key": "34096170", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1530421608511525, "ground_truth": 0}, {"key": "34096170", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2351083901056951, "ground_truth": 0}, {"key": "37891952", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18010666725886554, "ground_truth": 0}, {"key": "37891952", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1329642442913062, "ground_truth": 0}, {"key": "37891952", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14706452233885522, "ground_truth": 0}, {"key": "37891952", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19436783213451214, "ground_truth": 0}, {"key": "37891952", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12592277489713202, "ground_truth": 0}, {"key": "40186158", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03234433183234015, "ground_truth": 0}, {"key": "40186158", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04115288718947795, "ground_truth": 0}, {"key": "40186158", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04336580258490357, "ground_truth": 0}, {"key": "40186158", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.024423091635198384, "ground_truth": 0}, {"key": "40186158", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1480471895268198, "ground_truth": 0}, {"key": "37049719", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1329642404762274, "ground_truth": 0}, {"key": "37049719", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5214711705849343, "ground_truth": 0}, {"key": "37049719", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12210387548787013, "ground_truth": 0}, {"key": "37049719", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.28140561252160423, "ground_truth": 0}, {"key": "37049719", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3023910846204938, "ground_truth": 0}, {"key": "34610504", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5736784203536567, "ground_truth": 0}, {"key": "34610504", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3495327268752357, "ground_truth": 0}, {"key": "34610504", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6951311320037359, "ground_truth": 0}, {"key": "34610504", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5612147958157849, "ground_truth": 0}, {"key": "34610504", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4111108560590572, "ground_truth": 0}, {"key": "37595429", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.038756196440886834, "ground_truth": 0}, {"key": "37595429", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.004215159779186254, "ground_truth": 0}, {"key": "37595429", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.015483987589080747, "ground_truth": 0}, {"key": "37595429", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01609087358992797, "ground_truth": 0}, {"key": "37595429", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.027901378413463056, "ground_truth": 0}, {"key": "29772670", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.27512972943714853, "ground_truth": 0}, {"key": "29772670", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5755879923079897, "ground_truth": 0}, {"key": "29772670", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6442251187691598, "ground_truth": 0}, {"key": "29772670", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416384241138, "ground_truth": 0}, {"key": "29772670", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195201361633, "ground_truth": 0}, {"key": "36369872", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09947021257093888, "ground_truth": 0}, {"key": "36369872", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.018689307130534866, "ground_truth": 0}, {"key": "36369872", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06681232841713623, "ground_truth": 0}, {"key": "36369872", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11357958288611233, "ground_truth": 0}, {"key": "36369872", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15203224815407368, "ground_truth": 0}, {"key": "34527433", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027376489331347387, "ground_truth": 0}, {"key": "34527433", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.029760093191902922, "ground_truth": 0}, {"key": "34527433", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.030214587974265624, "ground_truth": 0}, {"key": "34527433", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.020964241629085625, "ground_truth": 0}, {"key": "34527433", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.018833130667306474, "ground_truth": 0}, {"key": "31111734", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05921025144427213, "ground_truth": 0}, {"key": "31111734", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0463782067578951, "ground_truth": 0}, {"key": "31111734", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.046724957049344894, "ground_truth": 0}, {"key": "31111734", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0803574660859776, "ground_truth": 0}, {"key": "31111734", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06418263972641591, "ground_truth": 0}, {"key": "40303872", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.031261914202108707, "ground_truth": 0}, {"key": "40303872", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.050893724891255494, "ground_truth": 0}, {"key": "40303872", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025565214080014515, "ground_truth": 0}, {"key": "40303872", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12043881866231555, "ground_truth": 0}, {"key": "40303872", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0960254955034054, "ground_truth": 0}, {"key": "33653553", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10087862135661244, "ground_truth": 0}, {"key": "33653553", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3775406641455149, "ground_truth": 0}, {"key": "33653553", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2893716902676111, "ground_truth": 0}, {"key": "33653553", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074559840198845, "ground_truth": 0}, {"key": "33653553", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5813030824552348, "ground_truth": 0}, {"key": "34404510", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03114383048466428, "ground_truth": 0}, {"key": "34404510", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.045522005798908666, "ground_truth": 0}, {"key": "34404510", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03234433088764338, "ground_truth": 0}, {"key": "34404510", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01368947897168988, "ground_truth": 0}, {"key": "34404510", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03222229591004808, "ground_truth": 0}, {"key": "35568692", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13660840518241124, "ground_truth": 0}, {"key": "35568692", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1135795919266699, "ground_truth": 0}, {"key": "35568692", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05165378303121031, "ground_truth": 0}, {"key": "35568692", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08151974832193394, "ground_truth": 0}, {"key": "35568692", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09467770118067037, "ground_truth": 0}, {"key": "39151664", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.36840569905437726, "ground_truth": 0}, {"key": "39151664", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1645164547570689, "ground_truth": 0}, {"key": "39151664", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12678516888012153, "ground_truth": 0}, {"key": "39151664", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168779328857374, "ground_truth": 0}, {"key": "39151664", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2877678174510495, "ground_truth": 0}, {"key": "37493670", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8714748682136447, "ground_truth": 0}, {"key": "37493670", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8910549537034732, "ground_truth": 0}, {"key": "37493670", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7302898995858367, "ground_truth": 0}, {"key": "37493670", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.663668957362163, "ground_truth": 0}, {"key": "37493670", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476562667465, "ground_truth": 0}, {"key": "21935983", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1710611748707478, "ground_truth": 0}, {"key": "21935983", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10266401279261869, "ground_truth": 0}, {"key": "21935983", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1356895489323299, "ground_truth": 0}, {"key": "21935983", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.26817411284615106, "ground_truth": 0}, {"key": "21935983", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06804042478100092, "ground_truth": 0}, {"key": "38174214", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16026603740045942, "ground_truth": 0}, {"key": "38174214", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12463856144171509, "ground_truth": 0}, {"key": "38174214", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19682620319799227, "ground_truth": 0}, {"key": "38174214", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22135069156231113, "ground_truth": 0}, {"key": "38174214", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.27982850600945897, "ground_truth": 0}, {"key": "40319923", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.092032855832469, "ground_truth": 0}, {"key": "40319923", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06608537386987717, "ground_truth": 0}, {"key": "40319923", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07978201417503315, "ground_truth": 0}, {"key": "40319923", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03649376756441527, "ground_truth": 0}, {"key": "40319923", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04038906780724482, "ground_truth": 0}, {"key": "36478264", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20625380912332617, "ground_truth": 0}, {"key": "36478264", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14706452061980224, "ground_truth": 0}, {"key": "36478264", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09877258853770435, "ground_truth": 0}, {"key": "36478264", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1859472070133185, "ground_truth": 0}, {"key": "36478264", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22000709412606903, "ground_truth": 0}, {"key": "11935769", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02953533798981288, "ground_truth": 0}, {"key": "11935769", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.015784562630057824, "ground_truth": 0}, {"key": "11935769", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07423136593113035, "ground_truth": 0}, {"key": "11935769", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06705628916179265, "ground_truth": 0}, {"key": "11935769", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.014063627266479218, "ground_truth": 0}, {"key": "33373410", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3665897453871909, "ground_truth": 0}, {"key": "33373410", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1955940801536261, "ground_truth": 0}, {"key": "33373410", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.39981165492401716, "ground_truth": 0}, {"key": "33373410", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14706452605927817, "ground_truth": 0}, {"key": "33373410", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220564414648169, "ground_truth": 0}, {"key": "11130680", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09434340836208875, "ground_truth": 0}, {"key": "11130680", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03963884096407109, "ground_truth": 0}, {"key": "11130680", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0038393950421961465, "ground_truth": 0}, {"key": "11130680", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.025274900975502602, "ground_truth": 0}, {"key": "11130680", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.015424551030406226, "ground_truth": 0}, {"key": "34868650", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05051767085864384, "ground_truth": 0}, {"key": "34868650", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03875619388030026, "ground_truth": 0}, {"key": "34868650", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04369105714689382, "ground_truth": 0}, {"key": "34868650", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03904829051239871, "ground_truth": 0}, {"key": "34868650", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03358950828411857, "ground_truth": 0}, {"key": "33960561", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22953520449841458, "ground_truth": 0}, {"key": "33960561", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13386748980214752, "ground_truth": 0}, {"key": "33960561", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13939638445695646, "ground_truth": 0}, {"key": "33960561", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08449275837550668, "ground_truth": 0}, {"key": "33960561", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08509904588488072, "ground_truth": 0}, {"key": "22504858", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19314738239301416, "ground_truth": 0}, {"key": "22504858", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.34864516862927003, "ground_truth": 0}, {"key": "22504858", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4282333942663583, "ground_truth": 0}, {"key": "22504858", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591163050807, "ground_truth": 0}, {"key": "22504858", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17050800496468163, "ground_truth": 0}, {"key": "32283530", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14033625507816416, "ground_truth": 0}, {"key": "32283530", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.029986508006305524, "ground_truth": 0}, {"key": "32283530", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11201595426909229, "ground_truth": 0}, {"key": "32283530", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05419872897503105, "ground_truth": 0}, {"key": "32283530", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03608394111283695, "ground_truth": 0}, {"key": "38377099", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14080817251167196, "ground_truth": 0}, {"key": "38377099", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10230470185769051, "ground_truth": 0}, {"key": "38377099", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0980793257682298, "ground_truth": 0}, {"key": "38377099", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04569203214282254, "ground_truth": 0}, {"key": "38377099", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06512754229868445, "ground_truth": 0}, {"key": "36105123", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02359929389607302, "ground_truth": 0}, {"key": "36105123", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.019197450659298797, "ground_truth": 0}, {"key": "36105123", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05665242496826997, "ground_truth": 0}, {"key": "36105123", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01572399097184342, "ground_truth": 0}, {"key": "36105123", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.018124721237379793, "ground_truth": 0}, {"key": "33527826", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2365162328268119, "ground_truth": 0}, {"key": "33527826", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12126887647505981, "ground_truth": 0}, {"key": "33527826", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.253861009543325, "ground_truth": 0}, {"key": "33527826", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910918578367, "ground_truth": 0}, {"key": "33527826", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.25982563200569403, "ground_truth": 0}, {"key": "32349891", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2751297260579242, "ground_truth": 0}, {"key": "32349891", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.31405053342884537, "ground_truth": 0}, {"key": "32349891", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.531209373420891, "ground_truth": 0}, {"key": "32349891", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.221350690879481, "ground_truth": 0}, {"key": "32349891", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.31742627452788846, "ground_truth": 0}, {"key": "34281974", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.012100385506511192, "ground_truth": 0}, {"key": "34281974", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.017110889635672585, "ground_truth": 0}, {"key": "34281974", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.028544151779427703, "ground_truth": 0}, {"key": "34281974", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03904829272191111, "ground_truth": 0}, {"key": "34281974", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05203782514229505, "ground_truth": 0}, {"key": "29387866", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14706452391582026, "ground_truth": 0}, {"key": "29387866", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2925953094747254, "ground_truth": 0}, {"key": "29387866", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6132365583454046, "ground_truth": 0}, {"key": "29387866", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629586153485718, "ground_truth": 0}, {"key": "29387866", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1677633485236182, "ground_truth": 0}, {"key": "35731925", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4301473491894254, "ground_truth": 0}, {"key": "35731925", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2568319942358387, "ground_truth": 0}, {"key": "35731925", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.28457601411316874, "ground_truth": 0}, {"key": "35731925", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782567885674473, "ground_truth": 0}, {"key": "35731925", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048022430564306, "ground_truth": 0}, {"key": "38829733", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4263215887791774, "ground_truth": 0}, {"key": "38829733", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17667161001772627, "ground_truth": 0}, {"key": "38829733", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.334589443182706, "ground_truth": 0}, {"key": "38829733", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.25386101964878804, "ground_truth": 0}, {"key": "38829733", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3486451541068483, "ground_truth": 0}, {"key": "24624736", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20561504967572053, "ground_truth": 0}, {"key": "24624736", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.072112198791237, "ground_truth": 0}, {"key": "24624736", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14080818031499695, "ground_truth": 0}, {"key": "24624736", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17217184812044667, "ground_truth": 0}, {"key": "24624736", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16451645034137755, "ground_truth": 0}, {"key": "36928562", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17441027051322316, "ground_truth": 0}, {"key": "36928562", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.43590152504912094, "ground_truth": 0}, {"key": "36928562", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.34158248422488313, "ground_truth": 0}, {"key": "36928562", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.30652705855215245, "ground_truth": 0}, {"key": "36928562", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2689414526975951, "ground_truth": 0}, {"key": "34941119", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.059866419265881265, "ground_truth": 0}, {"key": "34941119", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.027169232405825527, "ground_truth": 0}, {"key": "34941119", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01724277757587014, "ground_truth": 0}, {"key": "34941119", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.041930524330823726, "ground_truth": 0}, {"key": "34941119", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012821214293628801, "ground_truth": 0}, {"key": "30206231", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6001883499033178, "ground_truth": 0}, {"key": "30206231", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7057850283772251, "ground_truth": 0}, {"key": "30206231", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12506538737890033, "ground_truth": 0}, {"key": "30206231", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.36840572113543163, "ground_truth": 0}, {"key": "30206231", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.36658975577670094, "ground_truth": 0}, {"key": "35584972", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1384617922075881, "ground_truth": 0}, {"key": "35584972", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15817434952626186, "ground_truth": 0}, {"key": "35584972", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1613202436234945, "ground_truth": 0}, {"key": "35584972", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12506538290368988, "ground_truth": 0}, {"key": "35584972", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2068940565229944, "ground_truth": 0}, {"key": "39277709", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2018132268242019, "ground_truth": 0}, {"key": "39277709", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04369105735933419, "ground_truth": 0}, {"key": "39277709", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14903530822260644, "ground_truth": 0}, {"key": "39277709", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.040237941209090286, "ground_truth": 0}, {"key": "39277709", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09268777952354726, "ground_truth": 0}, {"key": "36123657", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08449276053001031, "ground_truth": 0}, {"key": "36123657", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.037608634267823036, "ground_truth": 0}, {"key": "36123657", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.027585281644643387, "ground_truth": 0}, {"key": "36123657", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09534946147094665, "ground_truth": 0}, {"key": "36123657", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05070536135709672, "ground_truth": 0}, {"key": "33363938", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05520868712885793, "ground_truth": 0}, {"key": "33363938", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.010818447390876517, "ground_truth": 0}, {"key": "33363938", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.036220058349083796, "ground_truth": 0}, {"key": "33363938", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04385456442797456, "ground_truth": 0}, {"key": "33363938", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.044348580890848754, "ground_truth": 0}, {"key": "37349129", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23370634860030554, "ground_truth": 0}, {"key": "37349129", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4629586174601704, "ground_truth": 0}, {"key": "37349129", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6076631581688766, "ground_truth": 0}, {"key": "37349129", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4205995891853502, "ground_truth": 0}, {"key": "37349129", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366073964744, "ground_truth": 0}, {"key": "37160199", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10158944965503716, "ground_truth": 0}, {"key": "37160199", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21206881849951983, "ground_truth": 0}, {"key": "37160199", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18952109921333954, "ground_truth": 0}, {"key": "37160199", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12252321616697384, "ground_truth": 0}, {"key": "37160199", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14223188176077178, "ground_truth": 0}, {"key": "35891053", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04501552987561172, "ground_truth": 0}, {"key": "35891053", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12336561700404255, "ground_truth": 0}, {"key": "35891053", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09739040110296997, "ground_truth": 0}, {"key": "35891053", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2704802210347955, "ground_truth": 0}, {"key": "35891053", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19072403281287603, "ground_truth": 0}, {"key": "40694542", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05127241553098204, "ground_truth": 0}, {"key": "40694542", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.023330767434182206, "ground_truth": 0}, {"key": "40694542", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03663136643474885, "ground_truth": 0}, {"key": "40694542", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.056236349394981504, "ground_truth": 0}, {"key": "40694542", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.041462277682797234, "ground_truth": 0}, {"key": "24645770", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2598256472438654, "ground_truth": 0}, {"key": "24645770", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4130035734106164, "ground_truth": 0}, {"key": "24645770", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3830641923393747, "ground_truth": 0}, {"key": "24645770", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.25982565095540566, "ground_truth": 0}, {"key": "24645770", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20181322392830287, "ground_truth": 0}, {"key": "37974587", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11357958618986144, "ground_truth": 0}, {"key": "37974587", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10594827399824616, "ground_truth": 0}, {"key": "37974587", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18594720616211116, "ground_truth": 0}, {"key": "37974587", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213447315919, "ground_truth": 0}, {"key": "37974587", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13117322297972492, "ground_truth": 0}, {"key": "40354149", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13477591554480056, "ground_truth": 0}, {"key": "40354149", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.022629202297035203, "ground_truth": 0}, {"key": "40354149", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2583259880816889, "ground_truth": 0}, {"key": "40354149", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09534945959783095, "ground_truth": 0}, {"key": "40354149", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04831607115275427, "ground_truth": 0}, {"key": "35519470", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03321117070159312, "ground_truth": 0}, {"key": "35519470", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.011823395374574483, "ground_truth": 0}, {"key": "35519470", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06656918481111061, "ground_truth": 0}, {"key": "35519470", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02017731886616163, "ground_truth": 0}, {"key": "35519470", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05379964413888591, "ground_truth": 0}, {"key": "36185624", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10230470408062668, "ground_truth": 0}, {"key": "36185624", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21733751618915306, "ground_truth": 0}, {"key": "36185624", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1883239896043815, "ground_truth": 0}, {"key": "36185624", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1778108635933276, "ground_truth": 0}, {"key": "36185624", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13206615540933922, "ground_truth": 0}, {"key": "39306113", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18126321180424518, "ground_truth": 0}, {"key": "39306113", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4902356188251857, "ground_truth": 0}, {"key": "39306113", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0775176571626651, "ground_truth": 0}, {"key": "39306113", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20055767370733968, "ground_truth": 0}, {"key": "39306113", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2798285052903783, "ground_truth": 0}, {"key": "19347718", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0333368245709042, "ground_truth": 0}, {"key": "19347718", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026657739512736426, "ground_truth": 0}, {"key": "19347718", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04023794436598567, "ground_truth": 0}, {"key": "19347718", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05146276414959506, "ground_truth": 0}, {"key": "19347718", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04256272947811444, "ground_truth": 0}, {"key": "21870064", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10374863011851186, "ground_truth": 0}, {"key": "21870064", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.00857748552185567, "ground_truth": 0}, {"key": "21870064", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.023870835461865393, "ground_truth": 0}, {"key": "21870064", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.00825159896251876, "ground_truth": 0}, {"key": "21870064", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.025957357702319377, "ground_truth": 0}, {"key": "37675776", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.012527933696332004, "ground_truth": 0}, {"key": "37675776", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.018404890864742868, "ground_truth": 0}, {"key": "37675776", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01048909194515894, "ground_truth": 0}, {"key": "37675776", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.027169231137606928, "ground_truth": 0}, {"key": "37675776", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.015189049868625194, "ground_truth": 0}, {"key": "38107017", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03890198178184027, "ground_truth": 0}, {"key": "38107017", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03635666527488636, "ground_truth": 0}, {"key": "38107017", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19806417267499676, "ground_truth": 0}, {"key": "38107017", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.022542965667995015, "ground_truth": 0}, {"key": "38107017", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.015247590910265939, "ground_truth": 0}, {"key": "40046472", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.003607616762043996, "ground_truth": 0}, {"key": "40046472", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.018194367605674402, "ground_truth": 0}, {"key": "40046472", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.016029147098995628, "ground_truth": 0}, {"key": "40046472", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03090896096970149, "ground_truth": 0}, {"key": "40046472", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.018978037624693828, "ground_truth": 0}, {"key": "32157820", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11838509485272192, "ground_truth": 0}, {"key": "32157820", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2674081726207592, "ground_truth": 0}, {"key": "32157820", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.390475847219004, "ground_truth": 0}, {"key": "32157820", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12085323667358934, "ground_truth": 0}, {"key": "32157820", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23231016038742144, "ground_truth": 0}, {"key": "41004037", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24364244903723378, "ground_truth": 0}, {"key": "41004037", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1460872549168519, "ground_truth": 0}, {"key": "41004037", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18126320397740864, "ground_truth": 0}, {"key": "41004037", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08945459641379952, "ground_truth": 0}, {"key": "41004037", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13477591732227281, "ground_truth": 0}, {"key": "21387993", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.27982851249190505, "ground_truth": 0}, {"key": "21387993", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22815650642429422, "ground_truth": 0}, {"key": "21387993", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.32082131075253273, "ground_truth": 0}, {"key": "21387993", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2553436466642937, "ground_truth": 0}, {"key": "21387993", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09138210398270931, "ground_truth": 0}, {"key": "34665539", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0539988380148826, "ground_truth": 0}, {"key": "34665539", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0869416630714322, "ground_truth": 0}, {"key": "34665539", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05728196947379191, "ground_truth": 0}, {"key": "34665539", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07004895709044535, "ground_truth": 0}, {"key": "34665539", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05320620136038499, "ground_truth": 0}, {"key": "37872111", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11201596384670055, "ground_truth": 0}, {"key": "37872111", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12940272597496064, "ground_truth": 0}, {"key": "37872111", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.357567519832659, "ground_truth": 0}, {"key": "37872111", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594721412795007, "ground_truth": 0}, {"key": "37872111", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2590751001757873, "ground_truth": 0}, {"key": "36629542", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06210312166743856, "ground_truth": 0}, {"key": "36629542", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06142403704720418, "ground_truth": 0}, {"key": "36629542", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04193052547858692, "ground_truth": 0}, {"key": "36629542", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04922211184852983, "ground_truth": 0}, {"key": "36629542", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.031858857083443624, "ground_truth": 0}, {"key": "36487527", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07978201476516102, "ground_truth": 0}, {"key": "36487527", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0403890678773442, "ground_truth": 0}, {"key": "36487527", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04518375484910049, "ground_truth": 0}, {"key": "36487527", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03283695380972842, "ground_truth": 0}, {"key": "36487527", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05561761145853748, "ground_truth": 0}, {"key": "37344756", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13660840138052474, "ground_truth": 0}, {"key": "37344756", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04468087331852828, "ground_truth": 0}, {"key": "37344756", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04742587147867511, "ground_truth": 0}, {"key": "37344756", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06705628756270607, "ground_truth": 0}, {"key": "37344756", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.014337030238205985, "ground_truth": 0}, {"key": "38707722", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05921024834556836, "ground_truth": 0}, {"key": "38707722", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0313804329604819, "ground_truth": 0}, {"key": "38707722", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.018264278362749846, "ground_truth": 0}, {"key": "38707722", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03258974229161552, "ground_truth": 0}, {"key": "38707722", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.046551274723018156, "ground_truth": 0}, {"key": "37093419", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18359363231004874, "ground_truth": 0}, {"key": "37093419", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.057071397911947125, "ground_truth": 0}, {"key": "37093419", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07864238176471944, "ground_truth": 0}, {"key": "37093419", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07423136574725671, "ground_truth": 0}, {"key": "37093419", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2689414435330308, "ground_truth": 0}, {"key": "35547391", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17667159985950673, "ground_truth": 0}, {"key": "35547391", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1789558908080296, "ground_truth": 0}, {"key": "35547391", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11757213901280884, "ground_truth": 0}, {"key": "35547391", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687308221199836, "ground_truth": 0}, {"key": "35547391", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1778108762236148, "ground_truth": 0}, {"key": "37173168", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03258974259859126, "ground_truth": 0}, {"key": "37173168", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0603076347551976, "ground_truth": 0}, {"key": "37173168", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03608394331502281, "ground_truth": 0}, {"key": "37173168", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03126191491153239, "ground_truth": 0}, {"key": "37173168", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03197955908459404, "ground_truth": 0}, {"key": "30725298", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09534946423449947, "ground_truth": 0}, {"key": "30725298", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08035746773618195, "ground_truth": 0}, {"key": "30725298", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.060086647974963964, "ground_truth": 0}, {"key": "30725298", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09138210903395877, "ground_truth": 0}, {"key": "30725298", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09401018619261804, "ground_truth": 0}, {"key": "33830573", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04885778072849612, "ground_truth": 0}, {"key": "33830573", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1276526254909608, "ground_truth": 0}, {"key": "33830573", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05480259662094586, "ground_truth": 0}, {"key": "33830573", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14706452341636658, "ground_truth": 0}, {"key": "33830573", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06853749177728814, "ground_truth": 0}, {"key": "33415474", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3090236985934984, "ground_truth": 0}, {"key": "33415474", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.30902370031179366, "ground_truth": 0}, {"key": "33415474", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15304216213497637, "ground_truth": 0}, {"key": "33415474", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06560483366395557, "ground_truth": 0}, {"key": "33415474", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1688569558587798, "ground_truth": 0}, {"key": "37383994", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11920292250858863, "ground_truth": 0}, {"key": "37383994", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09877259161420278, "ground_truth": 0}, {"key": "37383994", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09203285686491808, "ground_truth": 0}, {"key": "37383994", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.081812713331843, "ground_truth": 0}, {"key": "37383994", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421300880380642, "ground_truth": 0}, {"key": "38576819", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9111797102369197, "ground_truth": 0}, {"key": "38576819", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6279511917199246, "ground_truth": 0}, {"key": "38576819", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9847524095096132, "ground_truth": 0}, {"key": "38576819", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9473810423695341, "ground_truth": 0}, {"key": "38576819", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9656413116390735, "ground_truth": 0}, {"key": "34500226", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02865267049565337, "ground_truth": 0}, {"key": "34500226", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03704716922202905, "ground_truth": 0}, {"key": "34500226", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.030908961060887866, "ground_truth": 0}, {"key": "34500226", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.024053554226043744, "ground_truth": 0}, {"key": "34500226", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.025957357005019163, "ground_truth": 0}, {"key": "39856394", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05379964405083018, "ground_truth": 0}, {"key": "39856394", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.034100427216134405, "ground_truth": 0}, {"key": "39856394", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025760560406194594, "ground_truth": 0}, {"key": "39856394", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05223085267340171, "ground_truth": 0}, {"key": "39856394", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.020177320204479012, "ground_truth": 0}, {"key": "35499522", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.25534363628954515, "ground_truth": 0}, {"key": "35499522", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6169358049438078, "ground_truth": 0}, {"key": "35499522", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09073548029467829, "ground_truth": 0}, {"key": "35499522", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22884513415460317, "ground_truth": 0}, {"key": "35499522", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10374863666409269, "ground_truth": 0}, {"key": "30157766", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03594832436069222, "ground_truth": 0}, {"key": "30157766", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07558478102739676, "ground_truth": 0}, {"key": "30157766", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06954174361119694, "ground_truth": 0}, {"key": "30157766", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10932482444233237, "ground_truth": 0}, {"key": "30157766", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24798743551551006, "ground_truth": 0}, {"key": "40472346", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09203286164944982, "ground_truth": 0}, {"key": "40472346", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09602549579781353, "ground_truth": 0}, {"key": "40472346", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06394842064869873, "ground_truth": 0}, {"key": "40472346", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05791808598744606, "ground_truth": 0}, {"key": "40472346", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.049039619422836536, "ground_truth": 0}, {"key": "35305635", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.27357439636263226, "ground_truth": 0}, {"key": "35305635", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12252322013300548, "ground_truth": 0}, {"key": "35305635", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20181322223128817, "ground_truth": 0}, {"key": "35305635", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.255343656027809, "ground_truth": 0}, {"key": "35305635", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06142403918875911, "ground_truth": 0}, {"key": "32495926", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014172365395397648, "ground_truth": 0}, {"key": "32495926", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.054399321078307854, "ground_truth": 0}, {"key": "32495926", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04434857999049951, "ground_truth": 0}, {"key": "32495926", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04115288605137039, "ground_truth": 0}, {"key": "32495926", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10194651736854392, "ground_truth": 0}, {"key": "37353801", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.010818447364942387, "ground_truth": 0}, {"key": "37353801", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02737649002673732, "ground_truth": 0}, {"key": "37353801", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06233103628035239, "ground_truth": 0}, {"key": "37353801", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.035948323600278526, "ground_truth": 0}, {"key": "37353801", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.031618766975630215, "ground_truth": 0}, {"key": "30159904", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02080449058802754, "ground_truth": 0}, {"key": "30159904", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.022802637695407416, "ground_truth": 0}, {"key": "30159904", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.044348581498300156, "ground_truth": 0}, {"key": "30159904", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.011687257590478645, "ground_truth": 0}, {"key": "30159904", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.023153409284129445, "ground_truth": 0}, {"key": "33698679", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01861780158876785, "ground_truth": 0}, {"key": "33698679", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04831607163059175, "ground_truth": 0}, {"key": "33698679", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.037186775309607435, "ground_truth": 0}, {"key": "33698679", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03581319371220149, "ground_truth": 0}, {"key": "33698679", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.050893721328048334, "ground_truth": 0}, {"key": "40530172", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4148988416490285, "ground_truth": 0}, {"key": "40530172", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0956869395052123, "ground_truth": 0}, {"key": "40530172", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2450850093450538, "ground_truth": 0}, {"key": "40530172", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0479581020482992, "ground_truth": 0}, {"key": "40530172", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06608537520699395, "ground_truth": 0}, {"key": "40652941", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1143685173786296, "ground_truth": 0}, {"key": "40652941", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05500528601226032, "ground_truth": 0}, {"key": "40652941", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09268778238667152, "ground_truth": 0}, {"key": "40652941", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06187599009468308, "ground_truth": 0}, {"key": "40652941", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04620574955203355, "ground_truth": 0}, {"key": "40122246", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.36749723765524334, "ground_truth": 0}, {"key": "40122246", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1480471913515955, "ground_truth": 0}, {"key": "40122246", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.34158249962872006, "ground_truth": 0}, {"key": "40122246", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3233800965705821, "ground_truth": 0}, {"key": "40122246", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.37937837105305855, "ground_truth": 0}, {"key": "40032656", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.31405056702444123, "ground_truth": 0}, {"key": "40032656", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08756384623519403, "ground_truth": 0}, {"key": "40032656", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09947021180981061, "ground_truth": 0}, {"key": "40032656", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22815650338409926, "ground_truth": 0}, {"key": "40032656", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15405756491545655, "ground_truth": 0}, {"key": "38913680", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02479816048811276, "ground_truth": 0}, {"key": "38913680", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.012722708261782265, "ground_truth": 0}, {"key": "38913680", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0323443298845172, "ground_truth": 0}, {"key": "38913680", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01472861391030357, "ground_truth": 0}, {"key": "38913680", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03594832332183807, "ground_truth": 0}, {"key": "17608039", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.31069439371358, "ground_truth": 0}, {"key": "17608039", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.29910518809361736, "ground_truth": 0}, {"key": "17608039", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.38121956003815805, "ground_truth": 0}, {"key": "17608039", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18476751988065523, "ground_truth": 0}, {"key": "17608039", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.32252599251786734, "ground_truth": 0}, {"key": "40434901", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05300976987347307, "ground_truth": 0}, {"key": "40434901", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04401865411915038, "ground_truth": 0}, {"key": "40434901", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02194825437209849, "ground_truth": 0}, {"key": "40434901", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08570927944342922, "ground_truth": 0}, {"key": "40434901", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04795810368017961, "ground_truth": 0}, {"key": "37680058", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06853749626432211, "ground_truth": 0}, {"key": "37680058", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09009299925423431, "ground_truth": 0}, {"key": "37680058", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12085322756564333, "ground_truth": 0}, {"key": "37680058", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02737648965918368, "ground_truth": 0}, {"key": "37680058", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08389038723649109, "ground_truth": 0}, {"key": "37291821", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0665691890552032, "ground_truth": 0}, {"key": "37291821", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.010052368220430988, "ground_truth": 0}, {"key": "37291821", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.014899643067600919, "ground_truth": 0}, {"key": "37291821", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.019419346819961266, "ground_truth": 0}, {"key": "37291821", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.027272668784667393, "ground_truth": 0}, {"key": "41002743", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12421300684309902, "ground_truth": 0}, {"key": "41002743", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.27512973723824075, "ground_truth": 0}, {"key": "41002743", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2613309214484851, "ground_truth": 0}, {"key": "41002743", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1347759185010584, "ground_truth": 0}, {"key": "41002743", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2674081670183439, "ground_truth": 0}, {"key": "36322869", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09947021352480971, "ground_truth": 0}, {"key": "36322869", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13753247742909638, "ground_truth": 0}, {"key": "36322869", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.062103120202544916, "ground_truth": 0}, {"key": "36322869", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06804041995189256, "ground_truth": 0}, {"key": "36322869", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0548025930523488, "ground_truth": 0}, {"key": "39459717", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.35577489033079623, "ground_truth": 0}, {"key": "39459717", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16238003233677795, "ground_truth": 0}, {"key": "39459717", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.36477756694842584, "ground_truth": 0}, {"key": "39459717", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.43398146416497924, "ground_truth": 0}, {"key": "39459717", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4148988410495566, "ground_truth": 0}, {"key": "36503727", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04672495519456853, "ground_truth": 0}, {"key": "36503727", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0399373164692507, "ground_truth": 0}, {"key": "36503727", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02655657280710988, "ground_truth": 0}, {"key": "36503727", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05707139783294606, "ground_truth": 0}, {"key": "36503727", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03622006001145295, "ground_truth": 0}, {"key": "35682367", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.37570647687981235, "ground_truth": 0}, {"key": "35682367", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9105454006860818, "ground_truth": 0}, {"key": "35682367", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02976009386907971, "ground_truth": 0}, {"key": "35682367", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3276682934647882, "ground_truth": 0}, {"key": "35682367", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9500414730001127, "ground_truth": 0}, {"key": "36472353", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2628418610174863, "ground_truth": 0}, {"key": "36472353", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05707140059059972, "ground_truth": 0}, {"key": "36472353", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.011597362280542287, "ground_truth": 0}, {"key": "36472353", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.032713125047528525, "ground_truth": 0}, {"key": "36472353", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04146227668582241, "ground_truth": 0}, {"key": "37651907", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.017375664652401025, "ground_truth": 0}, {"key": "37651907", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02423763624433228, "ground_truth": 0}, {"key": "37651907", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03222229796281528, "ground_truth": 0}, {"key": "37651907", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08694166050102178, "ground_truth": 0}, {"key": "37651907", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12592277451898035, "ground_truth": 0}, {"key": "36255476", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01659317791724921, "ground_truth": 0}, {"key": "36255476", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.013689477330402159, "ground_truth": 0}, {"key": "36255476", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.021864556856028748, "ground_truth": 0}, {"key": "36255476", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03934250665391749, "ground_truth": 0}, {"key": "36255476", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024798162246146296, "ground_truth": 0}, {"key": "37283518", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23934935171462257, "ground_truth": 0}, {"key": "37283518", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.34334174992460476, "ground_truth": 0}, {"key": "37283518", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.31742628250138133, "ground_truth": 0}, {"key": "37283518", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3451052822432143, "ground_truth": 0}, {"key": "37283518", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21733750853420808, "ground_truth": 0}, {"key": "34906785", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01627746025738506, "ground_truth": 0}, {"key": "34906785", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.007785655474379549, "ground_truth": 0}, {"key": "34906785", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01317195052866094, "ground_truth": 0}, {"key": "34906785", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.010693758706634785, "ground_truth": 0}, {"key": "34906785", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.019719126619944998, "ground_truth": 0}, {"key": "34965328", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03448852620835791, "ground_truth": 0}, {"key": "34965328", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.017442483372615218, "ground_truth": 0}, {"key": "34965328", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02145073066398697, "ground_truth": 0}, {"key": "34965328", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.020567097538492497, "ground_truth": 0}, {"key": "34965328", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03541072581251876, "ground_truth": 0}, {"key": "38788440", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03044434982134352, "ground_truth": 0}, {"key": "38788440", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20307463886306854, "ground_truth": 0}, {"key": "38788440", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0726367081449706, "ground_truth": 0}, {"key": "38788440", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0663268718386018, "ground_truth": 0}, {"key": "38788440", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07055960026418638, "ground_truth": 0}, {"key": "35046866", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12808824669155022, "ground_truth": 0}, {"key": "35046866", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06233103881668123, "ground_truth": 0}, {"key": "35046866", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1901218422472631, "ground_truth": 0}, {"key": "35046866", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08035746703738358, "ground_truth": 0}, {"key": "35046866", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1343210555464797, "ground_truth": 0}, {"key": "37629558", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1008786157286062, "ground_truth": 0}, {"key": "37629558", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13206614441921105, "ground_truth": 0}, {"key": "37629558", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23091975484935107, "ground_truth": 0}, {"key": "37629558", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22815650475980875, "ground_truth": 0}, {"key": "37629558", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1818436447274993, "ground_truth": 0}, {"key": "33859914", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1645164570190872, "ground_truth": 0}, {"key": "33859914", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19682621896943597, "ground_truth": 0}, {"key": "33859914", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25534363827092166, "ground_truth": 0}, {"key": "33859914", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11596071325093253, "ground_truth": 0}, {"key": "33859914", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2689414453461208, "ground_truth": 0}, {"key": "39790523", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0587765616070294, "ground_truth": 0}, {"key": "39790523", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.055208690689492995, "ground_truth": 0}, {"key": "39790523", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0718512684478031, "ground_truth": 0}, {"key": "39790523", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08570927647002959, "ground_truth": 0}, {"key": "39790523", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05582314301532386, "ground_truth": 0}, {"key": "33509656", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2991051844847909, "ground_truth": 0}, {"key": "33509656", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3575675142365707, "ground_truth": 0}, {"key": "33509656", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12678517812774298, "ground_truth": 0}, {"key": "33509656", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064689757349, "ground_truth": 0}, {"key": "33509656", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991051951473412, "ground_truth": 0}, {"key": "17380923", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18242552269538423, "ground_truth": 0}, {"key": "17380923", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.052618955527272665, "ground_truth": 0}, {"key": "17380923", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06608537433122967, "ground_truth": 0}, {"key": "17380923", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10521053733970417, "ground_truth": 0}, {"key": "17380923", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07696083702149567, "ground_truth": 0}, {"key": "36202526", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22270014871481328, "ground_truth": 0}, {"key": "36202526", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15507847730424978, "ground_truth": 0}, {"key": "36202526", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13296424962025288, "ground_truth": 0}, {"key": "36202526", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08819004570123799, "ground_truth": 0}, {"key": "36202526", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.175538076362027, "ground_truth": 0}, {"key": "26419232", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.015072629790958185, "ground_truth": 0}, {"key": "26419232", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02920129082383381, "ground_truth": 0}, {"key": "26419232", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01646617453251205, "ground_truth": 0}, {"key": "26419232", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.028980631645611002, "ground_truth": 0}, {"key": "26419232", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.023962027157646996, "ground_truth": 0}, {"key": "34232398", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04069295421175363, "ground_truth": 0}, {"key": "34232398", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09670578982630385, "ground_truth": 0}, {"key": "34232398", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0644176673704234, "ground_truth": 0}, {"key": "34232398", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.030444350464860936, "ground_truth": 0}, {"key": "34232398", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08064661426414614, "ground_truth": 0}, {"key": "33586045", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07107366809614983, "ground_truth": 0}, {"key": "33586045", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03541072873083508, "ground_truth": 0}, {"key": "33586045", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04099902820584564, "ground_truth": 0}, {"key": "33586045", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05242456022411245, "ground_truth": 0}, {"key": "33586045", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.038756196696405606, "ground_truth": 0}, {"key": "32281151", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0960254891164678, "ground_truth": 0}, {"key": "32281151", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10669059560392984, "ground_truth": 0}, {"key": "32281151", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.024423090690326648, "ground_truth": 0}, {"key": "32281151", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.28937170711900706, "ground_truth": 0}, {"key": "32281151", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06142404092628126, "ground_truth": 0}, {"key": "37308159", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6460137224841244, "ground_truth": 0}, {"key": "37308159", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7057850089256873, "ground_truth": 0}, {"key": "37308159", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6706082871783771, "ground_truth": 0}, {"key": "37308159", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581422406384, "ground_truth": 0}, {"key": "37308159", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9494823316474041, "ground_truth": 0}, {"key": "35694408", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1623800260575451, "ground_truth": 0}, {"key": "35694408", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0408457170518198, "ground_truth": 0}, {"key": "35694408", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07640768214793389, "ground_truth": 0}, {"key": "35694408", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01678548990892292, "ground_truth": 0}, {"key": "35694408", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0838903869066282, "ground_truth": 0}, {"key": "39781995", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3311197490096965, "ground_truth": 0}, {"key": "39781995", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07316471874775334, "ground_truth": 0}, {"key": "39781995", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06142404221603587, "ground_truth": 0}, {"key": "39781995", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13660839623773954, "ground_truth": 0}, {"key": "39781995", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06008664825751031, "ground_truth": 0}, {"key": "22799372", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15765489578038785, "ground_truth": 0}, {"key": "22799372", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1048433655792729, "ground_truth": 0}, {"key": "22799372", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.015543648427818366, "ground_truth": 0}, {"key": "22799372", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07107366953300367, "ground_truth": 0}, {"key": "22799372", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07133199645441476, "ground_truth": 0}, {"key": "37428240", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01327388799638461, "ground_truth": 0}, {"key": "37428240", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04099902898626769, "ground_truth": 0}, {"key": "37428240", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.005533387813326496, "ground_truth": 0}, {"key": "37428240", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.051462763310855655, "ground_truth": 0}, {"key": "37428240", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06394842323152206, "ground_truth": 0}, {"key": "40612657", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2081789274930697, "ground_truth": 0}, {"key": "40612657", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10856642005762572, "ground_truth": 0}, {"key": "40612657", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08850466159961083, "ground_truth": 0}, {"key": "40612657", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1089450372284942, "ground_truth": 0}, {"key": "40612657", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370635119420158, "ground_truth": 0}, {"key": "34404662", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02595735632894516, "ground_truth": 0}, {"key": "34404662", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.034488523402481146, "ground_truth": 0}, {"key": "34404662", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025760560484243092, "ground_truth": 0}, {"key": "34404662", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05419872638043329, "ground_truth": 0}, {"key": "34404662", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024892802508537534, "ground_truth": 0}, {"key": "32619704", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.017848737631859617, "ground_truth": 0}, {"key": "32619704", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0646534905367282, "ground_truth": 0}, {"key": "32619704", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08151975420898373, "ground_truth": 0}, {"key": "32619704", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07640768038292599, "ground_truth": 0}, {"key": "32619704", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03488088939875252, "ground_truth": 0}, {"key": "39014883", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.004773722452018404, "ground_truth": 0}, {"key": "39014883", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.028328313195897504, "ground_truth": 0}, {"key": "39014883", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.008745182105483787, "ground_truth": 0}, {"key": "39014883", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04272219875181528, "ground_truth": 0}, {"key": "39014883", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02645577735293359, "ground_truth": 0}, {"key": "37982812", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.29583986551625585, "ground_truth": 0}, {"key": "37982812", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20181322169090987, "ground_truth": 0}, {"key": "37982812", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6224593278548722, "ground_truth": 0}, {"key": "37982812", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.361164721164479, "ground_truth": 0}, {"key": "37982812", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593260131124, "ground_truth": 0}, {"key": "28123476", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10521054002867541, "ground_truth": 0}, {"key": "28123476", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2689414399566228, "ground_truth": 0}, {"key": "28123476", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.28937170228628467, "ground_truth": 0}, {"key": "28123476", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2553436429484039, "ground_truth": 0}, {"key": "28123476", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1968262089471378, "ground_truth": 0}, {"key": "39078849", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03210070766540022, "ground_truth": 0}, {"key": "39078849", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.00985985500011171, "ground_truth": 0}, {"key": "39078849", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03185885647519889, "ground_truth": 0}, {"key": "39078849", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0028228329607125446, "ground_truth": 0}, {"key": "39078849", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012241275486088917, "ground_truth": 0}, {"key": "39414137", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.513668470663539, "ground_truth": 0}, {"key": "39414137", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.47073660875876705, "ground_truth": 0}, {"key": "39414137", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23091974628649903, "ground_truth": 0}, {"key": "39414137", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21272225478714393, "ground_truth": 0}, {"key": "39414137", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2766905490723536, "ground_truth": 0}, {"key": "37371354", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.028220987610805253, "ground_truth": 0}, {"key": "37371354", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17781087759840214, "ground_truth": 0}, {"key": "37371354", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03346293440347338, "ground_truth": 0}, {"key": "37371354", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03663136685705601, "ground_truth": 0}, {"key": "37371354", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16667540392337776, "ground_truth": 0}, {"key": "29497179", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15921740488100866, "ground_truth": 0}, {"key": "29497179", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13939638514142128, "ground_truth": 0}, {"key": "29497179", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05223085278302459, "ground_truth": 0}, {"key": "29497179", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.476579638795861, "ground_truth": 0}, {"key": "29497179", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512036044115, "ground_truth": 0}, {"key": "35908694", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2735743848437134, "ground_truth": 0}, {"key": "35908694", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13028541614688302, "ground_truth": 0}, {"key": "35908694", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07211220347138882, "ground_truth": 0}, {"key": "35908694", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.056236347608834954, "ground_truth": 0}, {"key": "35908694", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06097518075140703, "ground_truth": 0}, {"key": "37619358", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.46490158432508394, "ground_truth": 0}, {"key": "37619358", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.27669053521095827, "ground_truth": 0}, {"key": "37619358", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2689414461812094, "ground_truth": 0}, {"key": "37619358", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4687906243663621, "ground_truth": 0}, {"key": "37619358", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953520870034752, "ground_truth": 0}, {"key": "37293103", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.27202456549482973, "ground_truth": 0}, {"key": "37293103", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3174262881600639, "ground_truth": 0}, {"key": "37293103", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5698526522048526, "ground_truth": 0}, {"key": "37293103", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3702253748055049, "ground_truth": 0}, {"key": "37293103", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064700189582, "ground_truth": 0}, {"key": "36883729", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6976089000747853, "ground_truth": 0}, {"key": "36883729", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.727975463175256, "ground_truth": 0}, {"key": "36883729", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5774953600819845, "ground_truth": 0}, {"key": "36883729", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8037905983543049, "ground_truth": 0}, {"key": "36883729", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545657258415, "ground_truth": 0}, {"key": "39209521", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.010529711652933212, "ground_truth": 0}, {"key": "39209521", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0073173976657704785, "ground_truth": 0}, {"key": "39209521", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010611420796453417, "ground_truth": 0}, {"key": "39209521", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.015906390930545918, "ground_truth": 0}, {"key": "39209521", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.008644177639911297, "ground_truth": 0}, {"key": "27792571", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09877258885281485, "ground_truth": 0}, {"key": "27792571", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.038756193680295356, "ground_truth": 0}, {"key": "27792571", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05033062938877653, "ground_truth": 0}, {"key": "27792571", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02790137821407231, "ground_truth": 0}, {"key": "27792571", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09534945941120435, "ground_truth": 0}, {"key": "39755647", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09203285986083143, "ground_truth": 0}, {"key": "39755647", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09203285732622263, "ground_truth": 0}, {"key": "39755647", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.014842417939962282, "ground_truth": 0}, {"key": "39755647", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03271312724218734, "ground_truth": 0}, {"key": "39755647", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07477004543821486, "ground_truth": 0}, {"key": "40800537", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0838903872777641, "ground_truth": 0}, {"key": "40800537", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10669059174655438, "ground_truth": 0}, {"key": "40800537", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.257578267577567, "ground_truth": 0}, {"key": "40800537", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07978201348278663, "ground_truth": 0}, {"key": "40800537", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13986564649396518, "ground_truth": 0}, {"key": "14171461", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.024516336815431007, "ground_truth": 0}, {"key": "14171461", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.040237944843414974, "ground_truth": 0}, {"key": "14171461", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02976009260119323, "ground_truth": 0}, {"key": "14171461", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0329612451028571, "ground_truth": 0}, {"key": "14171461", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.014063626871932312, "ground_truth": 0}, {"key": "36892440", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1267851681702537, "ground_truth": 0}, {"key": "36892440", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.31573598661318514, "ground_truth": 0}, {"key": "36892440", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16238003434877324, "ground_truth": 0}, {"key": "36892440", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09105828941354248, "ground_truth": 0}, {"key": "36892440", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2049777417276427, "ground_truth": 0}, {"key": "33733410", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15921740014723912, "ground_truth": 0}, {"key": "33733410", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16451645338871182, "ground_truth": 0}, {"key": "33733410", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07004896200806428, "ground_truth": 0}, {"key": "33733410", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10230470536853381, "ground_truth": 0}, {"key": "33733410", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13028541624941892, "ground_truth": 0}, {"key": "38587765", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4785288456413277, "ground_truth": 0}, {"key": "38587765", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.32082128538026045, "ground_truth": 0}, {"key": "38587765", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4320633828851738, "ground_truth": 0}, {"key": "38587765", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.29665426728155786, "ground_truth": 0}, {"key": "38587765", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.32680832518549224, "ground_truth": 0}, {"key": "41065582", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05707140294126425, "ground_truth": 0}, {"key": "41065582", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15817435038534258, "ground_truth": 0}, {"key": "41065582", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2893717140814537, "ground_truth": 0}, {"key": "41065582", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09009299184354846, "ground_truth": 0}, {"key": "41065582", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3849121674985237, "ground_truth": 0}, {"key": "34713891", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9597620586694059, "ground_truth": 0}, {"key": "34713891", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1710611818182345, "ground_truth": 0}, {"key": "34713891", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06142403746715026, "ground_truth": 0}, {"key": "34713891", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11162800244790161, "ground_truth": 0}, {"key": "34713891", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07864238306737244, "ground_truth": 0}, {"key": "18913023", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1451153657482611, "ground_truth": 0}, {"key": "18913023", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6306849142179208, "ground_truth": 0}, {"key": "18913023", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.464901565574849, "ground_truth": 0}, {"key": "18913023", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011666178758, "ground_truth": 0}, {"key": "18913023", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688113198746, "ground_truth": 0}, {"key": "36884100", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.048496000911095315, "ground_truth": 0}, {"key": "36884100", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08509904282990396, "ground_truth": 0}, {"key": "36884100", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.060086649766869386, "ground_truth": 0}, {"key": "36884100", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12421300734072653, "ground_truth": 0}, {"key": "36884100", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1699562432865174, "ground_truth": 0}, {"key": "39899913", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0881900450901987, "ground_truth": 0}, {"key": "39899913", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06052939238872392, "ground_truth": 0}, {"key": "39899913", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025371311900527656, "ground_truth": 0}, {"key": "39899913", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.017576883889254845, "ground_truth": 0}, {"key": "39899913", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02876159015342961, "ground_truth": 0}, {"key": "30725366", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13341521800097944, "ground_truth": 0}, {"key": "30725366", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.25238405073551906, "ground_truth": 0}, {"key": "30725366", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.053601139668668335, "ground_truth": 0}, {"key": "30725366", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10123347639563268, "ground_truth": 0}, {"key": "30725366", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08632347988232608, "ground_truth": 0}, {"key": "26133523", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.019050899590143725, "ground_truth": 0}, {"key": "26133523", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.005301894586771433, "ground_truth": 0}, {"key": "26133523", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.012722708723832086, "ground_truth": 0}, {"key": "26133523", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.026255301462774362, "ground_truth": 0}, {"key": "26133523", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0408457193573093, "ground_truth": 0}, {"key": "29332665", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.31405056037337015, "ground_truth": 0}, {"key": "29332665", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05070536550528858, "ground_truth": 0}, {"key": "29332665", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2628418462213632, "ground_truth": 0}, {"key": "29332665", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561504833007083, "ground_truth": 0}, {"key": "29332665", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12336561190674213, "ground_truth": 0}, {"key": "37400481", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02716923389875287, "ground_truth": 0}, {"key": "37400481", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02566270788069822, "ground_truth": 0}, {"key": "37400481", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.057281972516630884, "ground_truth": 0}, {"key": "37400481", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04922211449788195, "ground_truth": 0}, {"key": "37400481", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06164961897035227, "ground_truth": 0}, {"key": "38787241", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08269734425533042, "ground_truth": 0}, {"key": "38787241", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.019419347278882778, "ground_truth": 0}, {"key": "38787241", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18832398940410777, "ground_truth": 0}, {"key": "38787241", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09602549393082897, "ground_truth": 0}, {"key": "38787241", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.046724956337875746, "ground_truth": 0}, {"key": "38225963", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03185885614293385, "ground_truth": 0}, {"key": "38225963", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026759282670831885, "ground_truth": 0}, {"key": "38225963", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08093670664968229, "ground_truth": 0}, {"key": "38225963", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08269733707772005, "ground_truth": 0}, {"key": "38225963", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757213860977578, "ground_truth": 0}, {"key": "26072034", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2351083897524122, "ground_truth": 0}, {"key": "26072034", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.056652421819204775, "ground_truth": 0}, {"key": "26072034", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.035678554949647806, "ground_truth": 0}, {"key": "26072034", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689404930392405, "ground_truth": 0}, {"key": "26072034", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08269734366919468, "ground_truth": 0}, {"key": "35690810", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10302442661795608, "ground_truth": 0}, {"key": "35690810", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2160115328812366, "ground_truth": 0}, {"key": "35690810", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6531269287084058, "ground_truth": 0}, {"key": "35690810", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4301473419050156, "ground_truth": 0}, {"key": "35690810", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.31069438537323324, "ground_truth": 0}, {"key": "36855665", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3757064891560002, "ground_truth": 0}, {"key": "36855665", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2658804829634306, "ground_truth": 0}, {"key": "36855665", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22953522506916613, "ground_truth": 0}, {"key": "36855665", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776333915482824, "ground_truth": 0}, {"key": "36855665", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24077459979693644, "ground_truth": 0}, {"key": "29757662", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.024892802787422907, "ground_truth": 0}, {"key": "29757662", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.009340024109134768, "ground_truth": 0}, {"key": "29757662", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09203286178946767, "ground_truth": 0}, {"key": "29757662", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.026556573525492552, "ground_truth": 0}, {"key": "29757662", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.032344331772991224, "ground_truth": 0}, {"key": "19134339", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04778006902437812, "ground_truth": 0}, {"key": "19134339", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08389038951415247, "ground_truth": 0}, {"key": "19134339", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0700489621105717, "ground_truth": 0}, {"key": "19134339", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16238003929140352, "ground_truth": 0}, {"key": "19134339", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05623634698871151, "ground_truth": 0}, {"key": "35360732", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08299415021819195, "ground_truth": 0}, {"key": "35360732", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06705628744373313, "ground_truth": 0}, {"key": "35360732", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16238002748609134, "ground_truth": 0}, {"key": "35360732", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12765261884932283, "ground_truth": 0}, {"key": "35360732", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05728197569191909, "ground_truth": 0}, {"key": "37713629", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.030214587935598596, "ground_truth": 0}, {"key": "37713629", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026657741292668513, "ground_truth": 0}, {"key": "37713629", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05184546842711976, "ground_truth": 0}, {"key": "37713629", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12506538416804489, "ground_truth": 0}, {"key": "37713629", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05184546781431181, "ground_truth": 0}, {"key": "33393394", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07133200398392824, "ground_truth": 0}, {"key": "33393394", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07316472045565522, "ground_truth": 0}, {"key": "33393394", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1699562315729682, "ground_truth": 0}, {"key": "33393394", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.058776561289757216, "ground_truth": 0}, {"key": "33393394", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08570927350955149, "ground_truth": 0}, {"key": "32275837", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07004895718747699, "ground_truth": 0}, {"key": "32275837", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07779745159154498, "ground_truth": 0}, {"key": "32275837", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2018132221434986, "ground_truth": 0}, {"key": "32275837", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.005384937739195491, "ground_truth": 0}, {"key": "32275837", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01578456146381827, "ground_truth": 0}, {"key": "21458094", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05261895535659574, "ground_truth": 0}, {"key": "21458094", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0960254877192839, "ground_truth": 0}, {"key": "21458094", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2689414441880964, "ground_truth": 0}, {"key": "21458094", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.021615332611932558, "ground_truth": 0}, {"key": "21458094", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.010735162750415791, "ground_truth": 0}, {"key": "40975362", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.47073662243325326, "ground_truth": 0}, {"key": "40975362", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5214711641206579, "ground_truth": 0}, {"key": "40975362", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.622459337220266, "ground_truth": 0}, {"key": "40975362", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786363676358, "ground_truth": 0}, {"key": "40975362", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.44167300021641487, "ground_truth": 0}, {"key": "35234201", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4649015694688772, "ground_truth": 0}, {"key": "35234201", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.34158249519466866, "ground_truth": 0}, {"key": "35234201", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21733751732832102, "ground_truth": 0}, {"key": "35234201", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245515840075, "ground_truth": 0}, {"key": "35234201", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794003963579374, "ground_truth": 0}, {"key": "36037573", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11596071345611235, "ground_truth": 0}, {"key": "36037573", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08945460177683488, "ground_truth": 0}, {"key": "36037573", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08882028436998345, "ground_truth": 0}, {"key": "36037573", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10447732393399464, "ground_truth": 0}, {"key": "36037573", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11124121649339451, "ground_truth": 0}, {"key": "30861915", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08269733608304179, "ground_truth": 0}, {"key": "30861915", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13660839552416232, "ground_truth": 0}, {"key": "30861915", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20055767825317278, "ground_truth": 0}, {"key": "30861915", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10087861704945175, "ground_truth": 0}, {"key": "30861915", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559407764502398, "ground_truth": 0}, {"key": "40173012", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23510839347834228, "ground_truth": 0}, {"key": "40173012", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3199707572295124, "ground_truth": 0}, {"key": "40173012", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2751297285901078, "ground_truth": 0}, {"key": "40173012", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653334870697682, "ground_truth": 0}, {"key": "40173012", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18892181335598984, "ground_truth": 0}, {"key": "35100330", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.243642457726674, "ground_truth": 0}, {"key": "35100330", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1789558861391138, "ground_truth": 0}, {"key": "35100330", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0980793277549018, "ground_truth": 0}, {"key": "35100330", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12085323966667955, "ground_truth": 0}, {"key": "35100330", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1744102700643635, "ground_truth": 0}, {"key": "37220221", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05379964589896313, "ground_truth": 0}, {"key": "37220221", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0897732937159088, "ground_truth": 0}, {"key": "37220221", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01379536405525475, "ground_truth": 0}, {"key": "37220221", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.021698097817674313, "ground_truth": 0}, {"key": "37220221", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07558478406180125, "ground_truth": 0}, {"key": "38815218", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16344543350207952, "ground_truth": 0}, {"key": "38815218", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1895210905274733, "ground_truth": 0}, {"key": "38815218", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.30239109395210173, "ground_truth": 0}, {"key": "38815218", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.183593633331996, "ground_truth": 0}, {"key": "38815218", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13753246956846107, "ground_truth": 0}, {"key": "39379109", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.011331754959531806, "ground_truth": 0}, {"key": "39379109", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.004755199968443163, "ground_truth": 0}, {"key": "39379109", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.002424914337136951, "ground_truth": 0}, {"key": "39379109", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.012194133850465434, "ground_truth": 0}, {"key": "39379109", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0042315876634637034, "ground_truth": 0}, {"key": "14576125", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04813676732451438, "ground_truth": 0}, {"key": "14576125", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.031143831728300084, "ground_truth": 0}, {"key": "14576125", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025957357527160795, "ground_truth": 0}, {"key": "14576125", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03210070755136296, "ground_truth": 0}, {"key": "14576125", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.027169232791132158, "ground_truth": 0}, {"key": "40814250", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03963884032844347, "ground_truth": 0}, {"key": "40814250", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1980641756287652, "ground_truth": 0}, {"key": "40814250", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09947021177341521, "ground_truth": 0}, {"key": "40814250", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15304215592171327, "ground_truth": 0}, {"key": "40814250", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3867634270523536, "ground_truth": 0}, {"key": "36334488", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9416541576312005, "ground_truth": 0}, {"key": "36334488", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5331543903088668, "ground_truth": 0}, {"key": "36334488", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6876299916989309, "ground_truth": 0}, {"key": "36334488", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389969709922, "ground_truth": 0}, {"key": "36334488", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.32252597755085455, "ground_truth": 0}, {"key": "36888322", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24077459068770113, "ground_truth": 0}, {"key": "36888322", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3960681649925552, "ground_truth": 0}, {"key": "36888322", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.28776782701807213, "ground_truth": 0}, {"key": "36888322", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.30735800493328974, "ground_truth": 0}, {"key": "36888322", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23091974773259044, "ground_truth": 0}, {"key": "37318916", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3775406624371119, "ground_truth": 0}, {"key": "37318916", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08151975173749303, "ground_truth": 0}, {"key": "37318916", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21601153894235994, "ground_truth": 0}, {"key": "37318916", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2422056438433243, "ground_truth": 0}, {"key": "37318916", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07423136974433661, "ground_truth": 0}, {"key": "39308700", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.058776557778235906, "ground_truth": 0}, {"key": "39308700", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10158944419057697, "ground_truth": 0}, {"key": "39308700", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11838510327004427, "ground_truth": 0}, {"key": "39308700", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03333682358790673, "ground_truth": 0}, {"key": "39308700", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07055959981840249, "ground_truth": 0}, {"key": "31061543", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014785407579692498, "ground_truth": 0}, {"key": "31061543", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05146276116346775, "ground_truth": 0}, {"key": "31061543", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.022457056022740583, "ground_truth": 0}, {"key": "31061543", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02120611986978474, "ground_truth": 0}, {"key": "31061543", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01987071325202273, "ground_truth": 0}, {"key": "37380894", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14223189137057693, "ground_truth": 0}, {"key": "37380894", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3738758160736637, "ground_truth": 0}, {"key": "37380894", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08449276068670254, "ground_truth": 0}, {"key": "37380894", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04146227544048668, "ground_truth": 0}, {"key": "37380894", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09203286591207671, "ground_truth": 0}, {"key": "38410139", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08210663264386746, "ground_truth": 0}, {"key": "38410139", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18832398065479225, "ground_truth": 0}, {"key": "38410139", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18952109090918717, "ground_truth": 0}, {"key": "38410139", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14128141158101107, "ground_truth": 0}, {"key": "38410139", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237151975293, "ground_truth": 0}, {"key": "35953842", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02876158798533046, "ground_truth": 0}, {"key": "35953842", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08601587874537275, "ground_truth": 0}, {"key": "35953842", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05051766905151982, "ground_truth": 0}, {"key": "35953842", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.039638840321242146, "ground_truth": 0}, {"key": "35953842", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.041462276361112514, "ground_truth": 0}, {"key": "39815663", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12085323292262651, "ground_truth": 0}, {"key": "39815663", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06052939139550155, "ground_truth": 0}, {"key": "39815663", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07978201258924247, "ground_truth": 0}, {"key": "39815663", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08509903934286578, "ground_truth": 0}, {"key": "39815663", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07921032226333742, "ground_truth": 0}, {"key": "35121432", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16344543329818803, "ground_truth": 0}, {"key": "35121432", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.020804489332046806, "ground_truth": 0}, {"key": "35121432", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05749327690667345, "ground_truth": 0}, {"key": "35121432", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.014503580478623709, "ground_truth": 0}, {"key": "35121432", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.028761588909877234, "ground_truth": 0}, {"key": "21712310", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09877259386737056, "ground_truth": 0}, {"key": "21712310", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.042403826155826004, "ground_truth": 0}, {"key": "21712310", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025565213078303672, "ground_truth": 0}, {"key": "21712310", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10743746999456072, "ground_truth": 0}, {"key": "21712310", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07477004777900331, "ground_truth": 0}, {"key": "37952914", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05749327699610208, "ground_truth": 0}, {"key": "37952914", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07640767745811818, "ground_truth": 0}, {"key": "37952914", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.057493275249363526, "ground_truth": 0}, {"key": "37952914", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08509903928121058, "ground_truth": 0}, {"key": "37952914", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09739039880001606, "ground_truth": 0}, {"key": "38956779", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9746286899068533, "ground_truth": 0}, {"key": "38956779", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5019531268175491, "ground_truth": 0}, {"key": "38956779", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6723316888852183, "ground_truth": 0}, {"key": "38956779", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199773898747, "ground_truth": 0}, {"key": "38956779", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9640516768029946, "ground_truth": 0}, {"key": "36101833", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03963883953975331, "ground_truth": 0}, {"key": "36101833", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.023241926292594035, "ground_truth": 0}, {"key": "36101833", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08151975324824669, "ground_truth": 0}, {"key": "36101833", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02405355395614649, "ground_truth": 0}, {"key": "36101833", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.023330768726219902, "ground_truth": 0}, {"key": "35544662", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06656919202744818, "ground_truth": 0}, {"key": "35544662", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.00881316656784392, "ground_truth": 0}, {"key": "35544662", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0474258721105104, "ground_truth": 0}, {"key": "35544662", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03803509689213652, "ground_truth": 0}, {"key": "35544662", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06853749147186566, "ground_truth": 0}, {"key": "39759044", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1581743619198266, "ground_truth": 0}, {"key": "39759044", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09636510271317626, "ground_truth": 0}, {"key": "39759044", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2180027193428606, "ground_truth": 0}, {"key": "39759044", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2759094566593191, "ground_truth": 0}, {"key": "39759044", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09367799836833587, "ground_truth": 0}, {"key": "39433018", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06608537976792958, "ground_truth": 0}, {"key": "39433018", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04603389789573956, "ground_truth": 0}, {"key": "39433018", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.050330635443721176, "ground_truth": 0}, {"key": "39433018", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02470386740335028, "ground_truth": 0}, {"key": "39433018", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05281402562948095, "ground_truth": 0}, {"key": "22111959", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7853085866022269, "ground_truth": 0}, {"key": "22111959", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09602549424752861, "ground_truth": 0}, {"key": "22111959", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.37204879415087794, "ground_truth": 0}, {"key": "22111959", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1030244275379139, "ground_truth": 0}, {"key": "22111959", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09947020552551819, "ground_truth": 0}, {"key": "38210094", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02161533203158077, "ground_truth": 0}, {"key": "38210094", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01191502318861389, "ground_truth": 0}, {"key": "38210094", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04501553274261607, "ground_truth": 0}, {"key": "38210094", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.013171949608394927, "ground_truth": 0}, {"key": "38210094", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.040540740318617874, "ground_truth": 0}, {"key": "37675935", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8322366576317539, "ground_truth": 0}, {"key": "37675935", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9469902227178147, "ground_truth": 0}, {"key": "37675935", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9339146223650758, "ground_truth": 0}, {"key": "37675935", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.937668960876015, "ground_truth": 0}, {"key": "37675935", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070049185707, "ground_truth": 0}, {"key": "35732604", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2942149692788912, "ground_truth": 0}, {"key": "35732604", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.322526001911933, "ground_truth": 0}, {"key": "35732604", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06278920843547497, "ground_truth": 0}, {"key": "35732604", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4610167930891645, "ground_truth": 0}, {"key": "35732604", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24798744069557485, "ground_truth": 0}, {"key": "27453212", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09842542161090533, "ground_truth": 0}, {"key": "27453212", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17272931067598474, "ground_truth": 0}, {"key": "27453212", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09334688067162698, "ground_truth": 0}, {"key": "27453212", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1470645341579971, "ground_truth": 0}, {"key": "27453212", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11279539698843462, "ground_truth": 0}, {"key": "39910047", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04867657192329306, "ground_truth": 0}, {"key": "39910047", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06301947043437757, "ground_truth": 0}, {"key": "39910047", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.029090758105559004, "ground_truth": 0}, {"key": "39910047", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0507053638174844, "ground_truth": 0}, {"key": "39910047", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05749327602533975, "ground_truth": 0}, {"key": "40054265", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1812632103466511, "ground_truth": 0}, {"key": "40054265", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08449275323368997, "ground_truth": 0}, {"key": "40054265", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25238403924113073, "ground_truth": 0}, {"key": "40054265", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.44939263462708784, "ground_truth": 0}, {"key": "40054265", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.038321974427472205, "ground_truth": 0}, {"key": "19984615", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3345894523158063, "ground_truth": 0}, {"key": "19984615", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12126888156349239, "ground_truth": 0}, {"key": "19984615", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1436676108395953, "ground_truth": 0}, {"key": "19984615", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09912085839125129, "ground_truth": 0}, {"key": "19984615", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1913276806295854, "ground_truth": 0}, {"key": "16490806", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.015365341856870584, "ground_truth": 0}, {"key": "16490806", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.016657040474021362, "ground_truth": 0}, {"key": "16490806", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03461884019722921, "ground_truth": 0}, {"key": "16490806", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02153287850487274, "ground_truth": 0}, {"key": "16490806", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.019419346488293767, "ground_truth": 0}, {"key": "36396237", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5774953828480881, "ground_truth": 0}, {"key": "36396237", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5234203325706357, "ground_truth": 0}, {"key": "36396237", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6113819721237657, "ground_truth": 0}, {"key": "36396237", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512714382225, "ground_truth": 0}, {"key": "36396237", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990694030828, "ground_truth": 0}, {"key": "40726444", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07668380240445061, "ground_truth": 0}, {"key": "40726444", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07751765384591909, "ground_truth": 0}, {"key": "40726444", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19012183521107884, "ground_truth": 0}, {"key": "40726444", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.059646940924656784, "ground_truth": 0}, {"key": "40726444", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06325052599225947, "ground_truth": 0}, {"key": "37314826", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13568955024759596, "ground_truth": 0}, {"key": "37314826", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10017222633025519, "ground_truth": 0}, {"key": "37314826", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08299414919132223, "ground_truth": 0}, {"key": "37314826", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11838509587153376, "ground_truth": 0}, {"key": "37314826", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08756383941664139, "ground_truth": 0}, {"key": "38506971", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04115288625190205, "ground_truth": 0}, {"key": "38506971", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026556572982144, "ground_truth": 0}, {"key": "38506971", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01730909729253308, "ground_truth": 0}, {"key": "38506971", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.031618766993582195, "ground_truth": 0}, {"key": "38506971", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05921025578006163, "ground_truth": 0}, {"key": "40699312", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13028542318415437, "ground_truth": 0}, {"key": "40699312", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18010666196691774, "ground_truth": 0}, {"key": "40699312", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07921032224539391, "ground_truth": 0}, {"key": "40699312", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04084571715109874, "ground_truth": 0}, {"key": "40699312", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.061875984651587244, "ground_truth": 0}, {"key": "34695474", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.016979991560934715, "ground_truth": 0}, {"key": "34695474", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0043653260403366066, "ground_truth": 0}, {"key": "34695474", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.018334452620348055, "ground_truth": 0}, {"key": "34695474", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.021044567781028384, "ground_truth": 0}, {"key": "34695474", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.008478401648493053, "ground_truth": 0}, {"key": "36281498", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7534666505335097, "ground_truth": 0}, {"key": "36281498", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8449215302137013, "ground_truth": 0}, {"key": "36281498", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6001883287347188, "ground_truth": 0}, {"key": "36281498", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772264029285, "ground_truth": 0}, {"key": "36281498", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199693824424, "ground_truth": 0}, {"key": "39558652", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08756384927150462, "ground_truth": 0}, {"key": "39558652", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1417559952628371, "ground_truth": 0}, {"key": "39558652", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25238404774287837, "ground_truth": 0}, {"key": "39558652", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4359015242089778, "ground_truth": 0}, {"key": "39558652", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20817893420739966, "ground_truth": 0}, {"key": "37330579", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.017045317055342048, "ground_truth": 0}, {"key": "37330579", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06878728573651373, "ground_truth": 0}, {"key": "37330579", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09235980302138314, "ground_truth": 0}, {"key": "37330579", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10411240907536008, "ground_truth": 0}, {"key": "37330579", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17895589085264552, "ground_truth": 0}, {"key": "40547658", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12336561674959902, "ground_truth": 0}, {"key": "40547658", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22541661059862023, "ground_truth": 0}, {"key": "40547658", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11838509782975305, "ground_truth": 0}, {"key": "40547658", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07978201303229268, "ground_truth": 0}, {"key": "40547658", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05480259369995408, "ground_truth": 0}, {"key": "37119340", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.006513498095588794, "ground_truth": 0}, {"key": "37119340", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.012147170716286017, "ground_truth": 0}, {"key": "37119340", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01646617527580185, "ground_truth": 0}, {"key": "37119340", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01411789415866541, "ground_truth": 0}, {"key": "37119340", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0034564099144504873, "ground_truth": 0}, {"key": "35301627", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09912085470039578, "ground_truth": 0}, {"key": "35301627", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05834583707407575, "ground_truth": 0}, {"key": "35301627", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05986642052644775, "ground_truth": 0}, {"key": "35301627", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.046033901421985005, "ground_truth": 0}, {"key": "35301627", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04434858228071074, "ground_truth": 0}, {"key": "34037168", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07978201557509214, "ground_truth": 0}, {"key": "34037168", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11047115106616849, "ground_truth": 0}, {"key": "34037168", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07949570326864744, "ground_truth": 0}, {"key": "34037168", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13251456735530528, "ground_truth": 0}, {"key": "34037168", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12002563129433616, "ground_truth": 0}, {"key": "39703862", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1955940683679886, "ground_truth": 0}, {"key": "39703862", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21469140235846093, "ground_truth": 0}, {"key": "39703862", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19314737614066668, "ground_truth": 0}, {"key": "39703862", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14128141984621923, "ground_truth": 0}, {"key": "39703862", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1883239964493467, "ground_truth": 0}, {"key": "16554814", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20946968810799724, "ground_truth": 0}, {"key": "16554814", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7994423254602976, "ground_truth": 0}, {"key": "16554814", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12252321481782812, "ground_truth": 0}, {"key": "16554814", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3665897521602086, "ground_truth": 0}, {"key": "16554814", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544874516276463, "ground_truth": 0}, {"key": "32983099", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22405545239495073, "ground_truth": 0}, {"key": "32983099", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03649376887242241, "ground_truth": 0}, {"key": "32983099", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15253652179397317, "ground_truth": 0}, {"key": "32983099", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06681232654757326, "ground_truth": 0}, {"key": "32983099", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10669059281755916, "ground_truth": 0}, {"key": "41072994", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15713685011369782, "ground_truth": 0}, {"key": "41072994", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04434857919451281, "ground_truth": 0}, {"key": "41072994", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.028007520831372656, "ground_truth": 0}, {"key": "41072994", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01812472039837508, "ground_truth": 0}, {"key": "41072994", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06142403932667841, "ground_truth": 0}, {"key": "38396247", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1495313904643051, "ground_truth": 0}, {"key": "38396247", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18010666417722415, "ground_truth": 0}, {"key": "38396247", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15974101747466787, "ground_truth": 0}, {"key": "38396247", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2628418472409209, "ground_truth": 0}, {"key": "38396247", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615696012459, "ground_truth": 0}, {"key": "37507998", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.021615331649810776, "ground_truth": 0}, {"key": "37507998", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.005001672636927081, "ground_truth": 0}, {"key": "37507998", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05749327316810299, "ground_truth": 0}, {"key": "37507998", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02451633755920489, "ground_truth": 0}, {"key": "37507998", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.016529556697441238, "ground_truth": 0}, {"key": "32593929", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0376086360933877, "ground_truth": 0}, {"key": "32593929", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.014227045694344917, "ground_truth": 0}, {"key": "32593929", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05707140327130969, "ground_truth": 0}, {"key": "32593929", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04272219765888484, "ground_truth": 0}, {"key": "32593929", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03875619258264894, "ground_truth": 0}, {"key": "36056449", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06325052485927242, "ground_truth": 0}, {"key": "36056449", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01678549049327061, "ground_truth": 0}, {"key": "36056449", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.030908960272738234, "ground_truth": 0}, {"key": "36056449", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.008677717177556362, "ground_truth": 0}, {"key": "36056449", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0844927562592028, "ground_truth": 0}, {"key": "21986185", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9777138146349736, "ground_truth": 0}, {"key": "21986185", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15713685735201066, "ground_truth": 0}, {"key": "21986185", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3311197626422245, "ground_truth": 0}, {"key": "21986185", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1789558875894308, "ground_truth": 0}, {"key": "21986185", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117972495607, "ground_truth": 0}, {"key": "40757465", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.042562730374730115, "ground_truth": 0}, {"key": "40757465", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09334687908385678, "ground_truth": 0}, {"key": "40757465", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02779562419567593, "ground_truth": 0}, {"key": "40757465", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09877258778177025, "ground_truth": 0}, {"key": "40757465", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14511535160749003, "ground_truth": 0}, {"key": "35198313", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20561505073292452, "ground_truth": 0}, {"key": "35198313", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15817435576548775, "ground_truth": 0}, {"key": "35198313", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1602660243246026, "ground_truth": 0}, {"key": "35198313", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06371499113133021, "ground_truth": 0}, {"key": "35198313", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.055412794343589186, "ground_truth": 0}, {"key": "30604618", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03789242502917116, "ground_truth": 0}, {"key": "30604618", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.032222299048892296, "ground_truth": 0}, {"key": "30604618", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10484336009678495, "ground_truth": 0}, {"key": "30604618", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05561761212230505, "ground_truth": 0}, {"key": "30604618", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12463856898595502, "ground_truth": 0}, {"key": "35779006", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04760265590565619, "ground_truth": 0}, {"key": "35779006", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08329192829454184, "ground_truth": 0}, {"key": "35779006", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04401865407316878, "ground_truth": 0}, {"key": "35779006", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07477004458064683, "ground_truth": 0}, {"key": "35779006", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.034229321129144404, "ground_truth": 0}, {"key": "33858956", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04569203249848135, "ground_truth": 0}, {"key": "33858956", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17441027919426708, "ground_truth": 0}, {"key": "33858956", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05964694100062658, "ground_truth": 0}, {"key": "33858956", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07807816268335392, "ground_truth": 0}, {"key": "33858956", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1338674947603885, "ground_truth": 0}, {"key": "38633880", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.031026178615183166, "ground_truth": 0}, {"key": "38633880", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07585818180712149, "ground_truth": 0}, {"key": "38633880", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.062331036914589646, "ground_truth": 0}, {"key": "38633880", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06008664640524882, "ground_truth": 0}, {"key": "38633880", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.035678554268815665, "ground_truth": 0}, {"key": "36654905", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7655933594032059, "ground_truth": 0}, {"key": "36654905", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6768335386728664, "ground_truth": 0}, {"key": "36654905", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6044573030069565, "ground_truth": 0}, {"key": "36654905", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.70035711585847, "ground_truth": 0}, {"key": "36654905", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8088988645139066, "ground_truth": 0}, {"key": "26547482", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0705595983029614, "ground_truth": 0}, {"key": "26547482", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.028870908098652448, "ground_truth": 0}, {"key": "26547482", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11279539673792308, "ground_truth": 0}, {"key": "26547482", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10087861728033332, "ground_truth": 0}, {"key": "26547482", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07159119891394689, "ground_truth": 0}, {"key": "36439068", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04054073807701085, "ground_truth": 0}, {"key": "36439068", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0753123051543485, "ground_truth": 0}, {"key": "36439068", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03222229938910663, "ground_truth": 0}, {"key": "36439068", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07423136812971039, "ground_truth": 0}, {"key": "36439068", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05856082439027343, "ground_truth": 0}, {"key": "30501258", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "30501258", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6315942850809985, "ground_truth": 0}, {"key": "30501258", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2991051857597132, "ground_truth": 0}, {"key": "30501258", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.261330928274602, "ground_truth": 0}, {"key": "30501258", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408930011274, "ground_truth": 0}, {"key": "37560941", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10087861286897179, "ground_truth": 0}, {"key": "37560941", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05813159502564756, "ground_truth": 0}, {"key": "37560941", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19193277981255108, "ground_truth": 0}, {"key": "37560941", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05964694133230351, "ground_truth": 0}, {"key": "37560941", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04724971393862675, "ground_truth": 0}, {"key": "36801665", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06754669082622224, "ground_truth": 0}, {"key": "36801665", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02527490161390719, "ground_truth": 0}, {"key": "36801665", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01267373471696665, "ground_truth": 0}, {"key": "36801665", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03789242703218418, "ground_truth": 0}, {"key": "36801665", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03346293374213741, "ground_truth": 0}, {"key": "34954610", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.028220986385623252, "ground_truth": 0}, {"key": "34954610", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05261895485991112, "ground_truth": 0}, {"key": "34954610", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03789242623488355, "ground_truth": 0}, {"key": "34954610", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03067579997593123, "ground_truth": 0}, {"key": "34954610", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.047074180611375034, "ground_truth": 0}, {"key": "37020510", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16026603400099068, "ground_truth": 0}, {"key": "37020510", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10374862658227194, "ground_truth": 0}, {"key": "37020510", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06954174220562831, "ground_truth": 0}, {"key": "37020510", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08093670964297633, "ground_truth": 0}, {"key": "37020510", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1613202438727026, "ground_truth": 0}, {"key": "38064637", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4148988315480796, "ground_truth": 0}, {"key": "38064637", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.37754066313003015, "ground_truth": 0}, {"key": "38064637", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6388352656715459, "ground_truth": 0}, {"key": "38064637", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3923368291681955, "ground_truth": 0}, {"key": "38064637", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737907630496, "ground_truth": 0}, {"key": "40886108", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10594827688878122, "ground_truth": 0}, {"key": "40886108", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11920292286392466, "ground_truth": 0}, {"key": "40886108", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09073548124074375, "ground_truth": 0}, {"key": "40886108", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09739040355741838, "ground_truth": 0}, {"key": "40886108", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10743747127878024, "ground_truth": 0}, {"key": "38554603", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.035410726807150746, "ground_truth": 0}, {"key": "38554603", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08882028901607844, "ground_truth": 0}, {"key": "38554603", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09947020615148415, "ground_truth": 0}, {"key": "38554603", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.116764010324286, "ground_truth": 0}, {"key": "38554603", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17106118577169302, "ground_truth": 0}, {"key": "39115586", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14318771188843266, "ground_truth": 0}, {"key": "39115586", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08329192269619683, "ground_truth": 0}, {"key": "39115586", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17553807936851554, "ground_truth": 0}, {"key": "39115586", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776334840787152, "ground_truth": 0}, {"key": "39115586", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1540575644766599, "ground_truth": 0}, {"key": "38786314", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18952109074779988, "ground_truth": 0}, {"key": "38786314", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17895589952954585, "ground_truth": 0}, {"key": "38786314", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.29098086836657905, "ground_truth": 0}, {"key": "38786314", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061682677995, "ground_truth": 0}, {"key": "38786314", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121952366228, "ground_truth": 0}, {"key": "38721078", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03594832380007781, "ground_truth": 0}, {"key": "38721078", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.014447853443305236, "ground_truth": 0}, {"key": "38721078", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0675466918482039, "ground_truth": 0}, {"key": "38721078", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.048496000072933955, "ground_truth": 0}, {"key": "38721078", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.034358687078684384, "ground_truth": 0}, {"key": "39475467", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24798744284987687, "ground_truth": 0}, {"key": "39475467", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05749327556628407, "ground_truth": 0}, {"key": "39475467", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25683200703665443, "ground_truth": 0}, {"key": "39475467", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10230470769864461, "ground_truth": 0}, {"key": "39475467", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.259825633451043, "ground_truth": 0}, {"key": "35691234", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3056973210170287, "ground_truth": 0}, {"key": "35691234", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.480478661608029, "ground_truth": 0}, {"key": "35691234", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.32252596727394756, "ground_truth": 0}, {"key": "35691234", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510840257340648, "ground_truth": 0}, {"key": "35691234", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1824255380316676, "ground_truth": 0}, {"key": "36871390", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09334687154203004, "ground_truth": 0}, {"key": "36871390", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04958902417026482, "ground_truth": 0}, {"key": "36871390", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.031380431265844964, "ground_truth": 0}, {"key": "36871390", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05146276248673097, "ground_truth": 0}, {"key": "36871390", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14414885160175814, "ground_truth": 0}, {"key": "31730844", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3276682942406377, "ground_truth": 0}, {"key": "31730844", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18010665721032632, "ground_truth": 0}, {"key": "31730844", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2674081626843917, "ground_truth": 0}, {"key": "31730844", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22953520717240053, "ground_truth": 0}, {"key": "31730844", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559408399895373, "ground_truth": 0}, {"key": "30810940", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.033972000447733214, "ground_truth": 0}, {"key": "30810940", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.00982179368696189, "ground_truth": 0}, {"key": "30810940", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0072608663072778, "ground_truth": 0}, {"key": "30810940", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02112519337696935, "ground_truth": 0}, {"key": "30810940", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.030100336271128982, "ground_truth": 0}, {"key": "39352003", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7634837647204725, "ground_truth": 0}, {"key": "39352003", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8925625199943358, "ground_truth": 0}, {"key": "39352003", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9092645136964902, "ground_truth": 0}, {"key": "39352003", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9416541596846363, "ground_truth": 0}, {"key": "39352003", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070054913551, "ground_truth": 0}, {"key": "40118123", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01665704043392985, "ground_truth": 0}, {"key": "40118123", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02645577765652751, "ground_truth": 0}, {"key": "40118123", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.008544330826936411, "ground_truth": 0}, {"key": "40118123", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02056709725198381, "ground_truth": 0}, {"key": "40118123", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01233610104228951, "ground_truth": 0}, {"key": "37114191", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.010693758253944348, "ground_truth": 0}, {"key": "37114191", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02675928456377398, "ground_truth": 0}, {"key": "37114191", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03746750782834375, "ground_truth": 0}, {"key": "37114191", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0508937203206112, "ground_truth": 0}, {"key": "37114191", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0221165904204676, "ground_truth": 0}, {"key": "39268203", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.024145422449025004, "ground_truth": 0}, {"key": "39268203", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03718677469877745, "ground_truth": 0}, {"key": "39268203", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.023419943922881735, "ground_truth": 0}, {"key": "39268203", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.018689307446117177, "ground_truth": 0}, {"key": "39268203", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.043528141333223594, "ground_truth": 0}, {"key": "37950968", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05582314292599844, "ground_truth": 0}, {"key": "37950968", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21601153536020146, "ground_truth": 0}, {"key": "37950968", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06979492100131754, "ground_truth": 0}, {"key": "37950968", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07369627523989994, "ground_truth": 0}, {"key": "37950968", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13753247552510928, "ground_truth": 0}, {"key": "34959807", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.108945035273905, "ground_truth": 0}, {"key": "34959807", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09203286425048061, "ground_truth": 0}, {"key": "34959807", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.054198732196314665, "ground_truth": 0}, {"key": "34959807", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04208772830845083, "ground_truth": 0}, {"key": "34959807", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0660853728362655, "ground_truth": 0}, {"key": "35631314", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14318770172693968, "ground_truth": 0}, {"key": "35631314", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0456920319764781, "ground_truth": 0}, {"key": "35631314", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07159119759397999, "ground_truth": 0}, {"key": "35631314", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04795810294146505, "ground_truth": 0}, {"key": "35631314", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.027169232051261514, "ground_truth": 0}, {"key": "38082365", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11838509894605011, "ground_truth": 0}, {"key": "38082365", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0556176145147493, "ground_truth": 0}, {"key": "38082365", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06278920604015097, "ground_truth": 0}, {"key": "38082365", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.048676575286865614, "ground_truth": 0}, {"key": "38082365", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03963884039598983, "ground_truth": 0}, {"key": "37242829", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.026355352938075415, "ground_truth": 0}, {"key": "37242829", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026355352424548846, "ground_truth": 0}, {"key": "37242829", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.011777843493220138, "ground_truth": 0}, {"key": "37242829", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02442309106891658, "ground_truth": 0}, {"key": "37242829", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.011687257116466532, "ground_truth": 0}, {"key": "38556068", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.006003595428278326, "ground_truth": 0}, {"key": "38556068", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.008061992242862427, "ground_truth": 0}, {"key": "38556068", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01036815720935394, "ground_truth": 0}, {"key": "38556068", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.005730246622012261, "ground_truth": 0}, {"key": "38556068", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.005620035928570919, "ground_truth": 0}, {"key": "32969336", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.012821214418736479, "ground_truth": 0}, {"key": "32969336", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.041773880783823644, "ground_truth": 0}, {"key": "32969336", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010611420832904174, "ground_truth": 0}, {"key": "32969336", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.011115013912993727, "ground_truth": 0}, {"key": "32969336", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.015723990797843708, "ground_truth": 0}, {"key": "36825153", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8407826033164314, "ground_truth": 0}, {"key": "36825153", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8799743706462763, "ground_truth": 0}, {"key": "36825153", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7813306239637511, "ground_truth": 0}, {"key": "36825153", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9076402023076909, "ground_truth": 0}, {"key": "36825153", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8929365378235047, "ground_truth": 0}, {"key": "41050146", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15921739698357426, "ground_truth": 0}, {"key": "41050146", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1081889603889591, "ground_truth": 0}, {"key": "41050146", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10447731837562409, "ground_truth": 0}, {"key": "41050146", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9149009582005725, "ground_truth": 0}, {"key": "41050146", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.835483542681774, "ground_truth": 0}, {"key": "27865037", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13117322747196966, "ground_truth": 0}, {"key": "27865037", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03138043228400003, "ground_truth": 0}, {"key": "27865037", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05541279434418326, "ground_truth": 0}, {"key": "27865037", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1167640067423956, "ground_truth": 0}, {"key": "27865037", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135069383045186, "ground_truth": 0}, {"key": "39868565", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4244119971589508, "ground_truth": 0}, {"key": "39868565", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1962094095104112, "ground_truth": 0}, {"key": "39868565", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19559407267841641, "ground_truth": 0}, {"key": "39868565", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22541662121450254, "ground_truth": 0}, {"key": "39868565", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.172171859529383, "ground_truth": 0}, {"key": "37761968", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02153287851900247, "ground_truth": 0}, {"key": "37761968", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08449275424169947, "ground_truth": 0}, {"key": "37761968", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01912403851622495, "ground_truth": 0}, {"key": "37761968", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.016466175698556355, "ground_truth": 0}, {"key": "37761968", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012241275776908945, "ground_truth": 0}, {"key": "16326139", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4035668647944696, "ground_truth": 0}, {"key": "16326139", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.41774647956590166, "ground_truth": 0}, {"key": "16326139", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.27202455569291284, "ground_truth": 0}, {"key": "16326139", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.44939263988577927, "ground_truth": 0}, {"key": "16326139", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4330221949375702, "ground_truth": 0}, {"key": "36568381", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14414885711535352, "ground_truth": 0}, {"key": "36568381", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15102779926141474, "ground_truth": 0}, {"key": "36568381", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15713684778051612, "ground_truth": 0}, {"key": "36568381", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07779744801325376, "ground_truth": 0}, {"key": "36568381", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08570928175164029, "ground_truth": 0}, {"key": "39855613", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16451645163098796, "ground_truth": 0}, {"key": "39855613", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07531230885831482, "ground_truth": 0}, {"key": "39855613", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19314737474037044, "ground_truth": 0}, {"key": "39855613", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06164961924472272, "ground_truth": 0}, {"key": "39855613", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10052487213377714, "ground_truth": 0}, {"key": "29856302", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07343005519944201, "ground_truth": 0}, {"key": "29856302", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.023153411440552905, "ground_truth": 0}, {"key": "29856302", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0067975315340232005, "ground_truth": 0}, {"key": "29856302", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.008093290693288603, "ground_truth": 0}, {"key": "29856302", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03846619401444624, "ground_truth": 0}, {"key": "35641106", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03934250210338852, "ground_truth": 0}, {"key": "35641106", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03704717299878824, "ground_truth": 0}, {"key": "35641106", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05033063370011628, "ground_truth": 0}, {"key": "35641106", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.030214588523269817, "ground_truth": 0}, {"key": "35641106", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12002563598302543, "ground_truth": 0}, {"key": "39474558", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03258974190343524, "ground_truth": 0}, {"key": "39474558", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02112519374954994, "ground_truth": 0}, {"key": "39474558", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.031143832846536438, "ground_truth": 0}, {"key": "39474558", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.024423092053898105, "ground_truth": 0}, {"key": "39474558", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.022802638446003685, "ground_truth": 0}, {"key": "34338135", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027480694349552703, "ground_truth": 0}, {"key": "34338135", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.012336100621929452, "ground_truth": 0}, {"key": "34338135", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02822098858129162, "ground_truth": 0}, {"key": "34338135", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04637820724883996, "ground_truth": 0}, {"key": "34338135", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.00867771715434594, "ground_truth": 0}, {"key": "35870330", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2735743930105659, "ground_truth": 0}, {"key": "35870330", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12168575387206068, "ground_truth": 0}, {"key": "35870330", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2068940460909197, "ground_truth": 0}, {"key": "35870330", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1907240332423564, "ground_truth": 0}, {"key": "35870330", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14318770398246536, "ground_truth": 0}, {"key": "24478245", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.30239109968729716, "ground_truth": 0}, {"key": "24478245", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.39793842674280683, "ground_truth": 0}, {"key": "24478245", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21206880919725646, "ground_truth": 0}, {"key": "24478245", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.327668302172809, "ground_truth": 0}, {"key": "24478245", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3979384023314653, "ground_truth": 0}, {"key": "38485946", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11486403387995882, "ground_truth": 0}, {"key": "38485946", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05042407036570875, "ground_truth": 0}, {"key": "38485946", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07463503811431842, "ground_truth": 0}, {"key": "38485946", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05023736267787778, "ground_truth": 0}, {"key": "38485946", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11075936557626444, "ground_truth": 0}, {"key": "32509613", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.40922079585684906, "ground_truth": 0}, {"key": "32509613", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16667540286952084, "ground_truth": 0}, {"key": "32509613", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3942009370085192, "ground_truth": 0}, {"key": "32509613", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.29583988166332675, "ground_truth": 0}, {"key": "32509613", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4111108488182498, "ground_truth": 0}, {"key": "34078819", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18713268994049975, "ground_truth": 0}, {"key": "34078819", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15203225086397756, "ground_truth": 0}, {"key": "34078819", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14657521045050995, "ground_truth": 0}, {"key": "34078819", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09041372464235906, "ground_truth": 0}, {"key": "34078819", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2523840538264049, "ground_truth": 0}, {"key": "39523865", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.27982850815913224, "ground_truth": 0}, {"key": "39523865", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12252321083071578, "ground_truth": 0}, {"key": "39523865", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2133771755446492, "ground_truth": 0}, {"key": "39523865", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18832398368384604, "ground_truth": 0}, {"key": "39523865", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13892842436562028, "ground_truth": 0}, {"key": "33146158", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20561505271125602, "ground_truth": 0}, {"key": "33146158", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18952109437634043, "ground_truth": 0}, {"key": "33146158", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22405546177185653, "ground_truth": 0}, {"key": "33146158", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11436852542709575, "ground_truth": 0}, {"key": "33146158", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11124121467486196, "ground_truth": 0}, {"key": "32083974", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "32083974", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16885695764046707, "ground_truth": 0}, {"key": "32083974", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.47463119099350004, "ground_truth": 0}, {"key": "32083974", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358508232263, "ground_truth": 0}, {"key": "32083974", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990673698465, "ground_truth": 0}, {"key": "34378482", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.36749723854442923, "ground_truth": 0}, {"key": "34378482", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5019531241968428, "ground_truth": 0}, {"key": "34378482", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.31237000707709467, "ground_truth": 0}, {"key": "34378482", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1993080158116582, "ground_truth": 0}, {"key": "34378482", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2798285045266378, "ground_truth": 0}, {"key": "38080102", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10970577310548409, "ground_truth": 0}, {"key": "38080102", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09434341399118185, "ground_truth": 0}, {"key": "38080102", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07807816314930484, "ground_truth": 0}, {"key": "38080102", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05770531407434824, "ground_truth": 0}, {"key": "38080102", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08210663345660077, "ground_truth": 0}, {"key": "40244537", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10230470934312247, "ground_truth": 0}, {"key": "40244537", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0129703879326721, "ground_truth": 0}, {"key": "40244537", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09670578518289072, "ground_truth": 0}, {"key": "40244537", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11357958372131678, "ground_truth": 0}, {"key": "40244537", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06008664851512513, "ground_truth": 0}, {"key": "33497789", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.032222298804910815, "ground_truth": 0}, {"key": "33497789", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02748069350295163, "ground_truth": 0}, {"key": "33497789", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02790137774960051, "ground_truth": 0}, {"key": "33497789", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.023689470790536973, "ground_truth": 0}, {"key": "33497789", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.023509451657791256, "ground_truth": 0}, {"key": "28816889", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6706082883884107, "ground_truth": 0}, {"key": "28816889", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18126319817721523, "ground_truth": 0}, {"key": "28816889", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3056973383238581, "ground_truth": 0}, {"key": "28816889", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17781087097296944, "ground_truth": 0}, {"key": "28816889", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10818895794234605, "ground_truth": 0}, {"key": "38157127", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8596637582003241, "ground_truth": 0}, {"key": "38157127", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05419873127973884, "ground_truth": 0}, {"key": "38157127", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7041601170654792, "ground_truth": 0}, {"key": "38157127", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3960681866019402, "ground_truth": 0}, {"key": "38157127", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1943678153023651, "ground_truth": 0}, {"key": "36183569", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16995623666057447, "ground_truth": 0}, {"key": "36183569", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2798284926433435, "ground_truth": 0}, {"key": "36183569", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20561504565002245, "ground_truth": 0}, {"key": "36183569", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2674081662749599, "ground_truth": 0}, {"key": "36183569", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3539863011596887, "ground_truth": 0}, {"key": "36012016", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.040845717915476566, "ground_truth": 0}, {"key": "36012016", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.013070784377093386, "ground_truth": 0}, {"key": "36012016", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04518375626665473, "ground_truth": 0}, {"key": "36012016", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02064593052448445, "ground_truth": 0}, {"key": "36012016", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02010023557309965, "ground_truth": 0}, {"key": "34571973", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12506537993378794, "ground_truth": 0}, {"key": "34571973", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.030444348961848538, "ground_truth": 0}, {"key": "34571973", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12168575146429597, "ground_truth": 0}, {"key": "34571973", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.025178843455078755, "ground_truth": 0}, {"key": "34571973", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0570713988066332, "ground_truth": 0}, {"key": "38707498", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4513265187464523, "ground_truth": 0}, {"key": "38707498", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16721866829022058, "ground_truth": 0}, {"key": "38707498", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.39981164707212885, "ground_truth": 0}, {"key": "38707498", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08663206988961297, "ground_truth": 0}, {"key": "38707498", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04867657058657227, "ground_truth": 0}, {"key": "35459082", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.32766828402164194, "ground_truth": 0}, {"key": "35459082", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14706452032070244, "ground_truth": 0}, {"key": "35459082", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17217184969208216, "ground_truth": 0}, {"key": "35459082", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185261642192, "ground_truth": 0}, {"key": "35459082", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2893716976459166, "ground_truth": 0}, {"key": "39464041", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6451199087408731, "ground_truth": 0}, {"key": "39464041", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.640635839289677, "ground_truth": 0}, {"key": "39464041", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6774739970100687, "ground_truth": 0}, {"key": "39464041", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5457699482289236, "ground_truth": 0}, {"key": "39464041", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6522413998189801, "ground_truth": 0}, {"key": "23782052", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.012576347980235875, "ground_truth": 0}, {"key": "23782052", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03474962886400767, "ground_truth": 0}, {"key": "23782052", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.041462274672155436, "ground_truth": 0}, {"key": "23782052", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01912403721406611, "ground_truth": 0}, {"key": "23782052", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.026657740557841543, "ground_truth": 0}, {"key": "36568455", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0474258757067276, "ground_truth": 0}, {"key": "36568455", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04672495508311223, "ground_truth": 0}, {"key": "36568455", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.046551270206281616, "ground_truth": 0}, {"key": "36568455", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07211219671559585, "ground_truth": 0}, {"key": "36568455", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07585818419825983, "ground_truth": 0}, {"key": "38469552", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0351448467123851, "ground_truth": 0}, {"key": "38469552", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.017712299358163652, "ground_truth": 0}, {"key": "38469552", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010611420428848412, "ground_truth": 0}, {"key": "38469552", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.021864558781424414, "ground_truth": 0}, {"key": "38469552", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024053552852405735, "ground_truth": 0}, {"key": "35922277", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11436852512925123, "ground_truth": 0}, {"key": "35922277", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08756384419200175, "ground_truth": 0}, {"key": "35922277", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0675466974388444, "ground_truth": 0}, {"key": "35922277", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.025957357716174037, "ground_truth": 0}, {"key": "35922277", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06097518347400286, "ground_truth": 0}, {"key": "32744293", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04672495737934343, "ground_truth": 0}, {"key": "32744293", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22270014071867347, "ground_truth": 0}, {"key": "32744293", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4687906333580144, "ground_truth": 0}, {"key": "32744293", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19806415944213018, "ground_truth": 0}, {"key": "32744293", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15203225201553905, "ground_truth": 0}, {"key": "30972362", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.049958524651181814, "ground_truth": 0}, {"key": "30972362", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15921740256602412, "ground_truth": 0}, {"key": "30972362", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.24508500920821047, "ground_truth": 0}, {"key": "30972362", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225259841211797, "ground_truth": 0}, {"key": "30972362", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1183851033125647, "ground_truth": 0}, {"key": "36380943", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04637820576668747, "ground_truth": 0}, {"key": "36380943", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.022977368828290528, "ground_truth": 0}, {"key": "36380943", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05834584019111823, "ground_truth": 0}, {"key": "36380943", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.025760560551380072, "ground_truth": 0}, {"key": "36380943", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06489011277743853, "ground_truth": 0}, {"key": "36929355", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07423136595198823, "ground_truth": 0}, {"key": "36929355", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10669059173183185, "ground_truth": 0}, {"key": "36929355", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05146276607876649, "ground_truth": 0}, {"key": "36929355", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05340333445086281, "ground_truth": 0}, {"key": "36929355", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.039048291545605934, "ground_truth": 0}, {"key": "39127206", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13296424906231924, "ground_truth": 0}, {"key": "39127206", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.020410308001339333, "ground_truth": 0}, {"key": "39127206", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.049589022441268844, "ground_truth": 0}, {"key": "39127206", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15002881613048447, "ground_truth": 0}, {"key": "39127206", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14463143938651776, "ground_truth": 0}, {"key": "36128318", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20689405967897176, "ground_truth": 0}, {"key": "36128318", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.142231892078846, "ground_truth": 0}, {"key": "36128318", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25982564242812867, "ground_truth": 0}, {"key": "36128318", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.209469692366631, "ground_truth": 0}, {"key": "36128318", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15610490111986627, "ground_truth": 0}, {"key": "39863480", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10894504184027108, "ground_truth": 0}, {"key": "39863480", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03461884243673968, "ground_truth": 0}, {"key": "39863480", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03890198252755801, "ground_truth": 0}, {"key": "39863480", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.019643759744949557, "ground_truth": 0}, {"key": "39863480", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07504072228338625, "ground_truth": 0}, {"key": "38634057", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.27202455718051816, "ground_truth": 0}, {"key": "38634057", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.29992476665486173, "ground_truth": 0}, {"key": "38634057", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.34246157459628934, "ground_truth": 0}, {"key": "38634057", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3157359814839193, "ground_truth": 0}, {"key": "38634057", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2531218244397741, "ground_truth": 0}, {"key": "33131935", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12378868498477494, "ground_truth": 0}, {"key": "33131935", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02096423936668893, "ground_truth": 0}, {"key": "33131935", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03514484526304389, "ground_truth": 0}, {"key": "33131935", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04535258262228263, "ground_truth": 0}, {"key": "33131935", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03138043247257452, "ground_truth": 0}, {"key": "39021319", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5253688279755596, "ground_truth": 0}, {"key": "39021319", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.39981167308839843, "ground_truth": 0}, {"key": "39021319", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.859663749333228, "ground_truth": 0}, {"key": "39021319", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3923368374405961, "ground_truth": 0}, {"key": "39021319", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.31742627312351485, "ground_truth": 0}, {"key": "40644571", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14804718937859443, "ground_truth": 0}, {"key": "40644571", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16132023344702792, "ground_truth": 0}, {"key": "40644571", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06371499799947578, "ground_truth": 0}, {"key": "40644571", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11556087308560835, "ground_truth": 0}, {"key": "40644571", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.108566422407923, "ground_truth": 0}, {"key": "14681877", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15713685649884204, "ground_truth": 0}, {"key": "14681877", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07585818083283472, "ground_truth": 0}, {"key": "14681877", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1403362458568988, "ground_truth": 0}, {"key": "14681877", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19868534296543056, "ground_truth": 0}, {"key": "14681877", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0499585233587355, "ground_truth": 0}, {"key": "36570890", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.031979562229622664, "ground_truth": 0}, {"key": "36570890", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03461883998543574, "ground_truth": 0}, {"key": "36570890", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.028870908112248916, "ground_truth": 0}, {"key": "36570890", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.017375665453850945, "ground_truth": 0}, {"key": "36570890", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08269734321673715, "ground_truth": 0}, {"key": "30452755", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0123361013541777, "ground_truth": 0}, {"key": "30452755", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03321117011152791, "ground_truth": 0}, {"key": "30452755", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.015784562015393508, "ground_truth": 0}, {"key": "30452755", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.011597361151818959, "ground_truth": 0}, {"key": "30452755", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.014117892862979872, "ground_truth": 0}, {"key": "37347053", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03333682507668553, "ground_truth": 0}, {"key": "37347053", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0566524226596315, "ground_truth": 0}, {"key": "37347053", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025565213618665265, "ground_truth": 0}, {"key": "37347053", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15817434841338973, "ground_truth": 0}, {"key": "37347053", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11596070927010473, "ground_truth": 0}, {"key": "38890979", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04304285139566846, "ground_truth": 0}, {"key": "38890979", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0512724220587862, "ground_truth": 0}, {"key": "38890979", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03044434865553368, "ground_truth": 0}, {"key": "38890979", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.035948322493547874, "ground_truth": 0}, {"key": "38890979", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05686155343314876, "ground_truth": 0}, {"key": "32974694", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0780781659982751, "ground_truth": 0}, {"key": "32974694", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1824255292551004, "ground_truth": 0}, {"key": "32974694", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.024609928235920734, "ground_truth": 0}, {"key": "32974694", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14511536403185352, "ground_truth": 0}, {"key": "32974694", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.040237944912460605, "ground_truth": 0}, {"key": "38519940", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5039061699271454, "ground_truth": 0}, {"key": "38519940", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17217185789435954, "ground_truth": 0}, {"key": "38519940", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3259495272459042, "ground_truth": 0}, {"key": "38519940", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2751297143983467, "ground_truth": 0}, {"key": "38519940", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359015324032869, "ground_truth": 0}, {"key": "38870104", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.023065226253169323, "ground_truth": 0}, {"key": "38870104", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.039195133815009664, "ground_truth": 0}, {"key": "38870104", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0194938727559785, "ground_truth": 0}, {"key": "38870104", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0589930330978228, "ground_truth": 0}, {"key": "38870104", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.021864557613293163, "ground_truth": 0}, {"key": "34283161", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.057071399221891785, "ground_truth": 0}, {"key": "34283161", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04885777744371892, "ground_truth": 0}, {"key": "34283161", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.028436033075892812, "ground_truth": 0}, {"key": "34283161", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11436852323715664, "ground_truth": 0}, {"key": "34283161", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.84695783744677, "ground_truth": 0}, {"key": "31650463", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.031738591321771065, "ground_truth": 0}, {"key": "31650463", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03890198105369456, "ground_truth": 0}, {"key": "31650463", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01949387155810376, "ground_truth": 0}, {"key": "31650463", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03435868904097798, "ground_truth": 0}, {"key": "31650463", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012920472091649284, "ground_truth": 0}, {"key": "35589432", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2538610125999374, "ground_truth": 0}, {"key": "35589432", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7041601552017825, "ground_truth": 0}, {"key": "35589432", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2689414389510237, "ground_truth": 0}, {"key": "35589432", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16026602847032811, "ground_truth": 0}, {"key": "35589432", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06560483396770274, "ground_truth": 0}, {"key": "14412752", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5621765079194546, "ground_truth": 0}, {"key": "14412752", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5448014011825416, "ground_truth": 0}, {"key": "14412752", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2538610158543364, "ground_truth": 0}, {"key": "14412752", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.462958616483604, "ground_truth": 0}, {"key": "14412752", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.26435837772746046, "ground_truth": 0}, {"key": "37271183", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.35756751814182014, "ground_truth": 0}, {"key": "37271183", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4707365923593553, "ground_truth": 0}, {"key": "37271183", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3979384208171207, "ground_truth": 0}, {"key": "37271183", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734880561308, "ground_truth": 0}, {"key": "37271183", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.276690516801266, "ground_truth": 0}, {"key": "35588153", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0875638406537283, "ground_truth": 0}, {"key": "35588153", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05665242693073718, "ground_truth": 0}, {"key": "35588153", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11838509641827806, "ground_truth": 0}, {"key": "35588153", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.051845469914977106, "ground_truth": 0}, {"key": "35588153", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1393963799327633, "ground_truth": 0}, {"key": "39876692", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3575675098622019, "ground_truth": 0}, {"key": "39876692", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0695417450985858, "ground_truth": 0}, {"key": "39876692", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2877678166521294, "ground_truth": 0}, {"key": "39876692", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4416730087324044, "ground_truth": 0}, {"key": "39876692", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.34158250854598043, "ground_truth": 0}, {"key": "38992323", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02262919932074024, "ground_truth": 0}, {"key": "38992323", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.023153410141879414, "ground_truth": 0}, {"key": "38992323", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0764076792387002, "ground_truth": 0}, {"key": "38992323", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.058131594661917675, "ground_truth": 0}, {"key": "38992323", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02033235216889131, "ground_truth": 0}, {"key": "37556002", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06325052587905089, "ground_truth": 0}, {"key": "37556002", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2861692640726762, "ground_truth": 0}, {"key": "37556002", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09807932826873643, "ground_truth": 0}, {"key": "37556002", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2877678070866962, "ground_truth": 0}, {"key": "37556002", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17106118660794126, "ground_truth": 0}, {"key": "39875801", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.051845468071818945, "ground_truth": 0}, {"key": "39875801", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.014227046110222753, "ground_truth": 0}, {"key": "39875801", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14175599234924954, "ground_truth": 0}, {"key": "39875801", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.020964240412175546, "ground_truth": 0}, {"key": "39875801", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05146276747004663, "ground_truth": 0}, {"key": "39272285", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.602061587735639, "ground_truth": 0}, {"key": "39272285", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.904650541987677, "ground_truth": 0}, {"key": "39272285", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3468730649575405, "ground_truth": 0}, {"key": "39272285", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17106118515991314, "ground_truth": 0}, {"key": "39272285", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06560483159543595, "ground_truth": 0}, {"key": "39629714", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0718512733422196, "ground_truth": 0}, {"key": "39629714", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03090895908540333, "ground_truth": 0}, {"key": "39629714", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04867656912895046, "ground_truth": 0}, {"key": "39629714", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08122775417109158, "ground_truth": 0}, {"key": "39629714", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07263670658747674, "ground_truth": 0}, {"key": "34043257", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03875619574785167, "ground_truth": 0}, {"key": "34043257", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01883313060843904, "ground_truth": 0}, {"key": "34043257", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.013532148811541207, "ground_truth": 0}, {"key": "34043257", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009485713944379063, "ground_truth": 0}, {"key": "34043257", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.018833130652380126, "ground_truth": 0}, {"key": "33995240", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.022802637597124017, "ground_truth": 0}, {"key": "33995240", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05964693807409525, "ground_truth": 0}, {"key": "33995240", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09912085456559291, "ground_truth": 0}, {"key": "33995240", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.016277460529908205, "ground_truth": 0}, {"key": "33995240", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04240382572717133, "ground_truth": 0}, {"key": "39399948", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6636689611582447, "ground_truth": 0}, {"key": "39399948", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.407333404089634, "ground_truth": 0}, {"key": "39399948", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3040416794772665, "ground_truth": 0}, {"key": "39399948", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632712846042, "ground_truth": 0}, {"key": "39399948", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220564821072113, "ground_truth": 0}, {"key": "33185890", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.008219692860128126, "ground_truth": 0}, {"key": "33185890", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01536534258070159, "ground_truth": 0}, {"key": "33185890", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.013795364169501686, "ground_truth": 0}, {"key": "33185890", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01737566549104896, "ground_truth": 0}, {"key": "33185890", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.030444350561018827, "ground_truth": 0}, {"key": "35280425", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12506538444710621, "ground_truth": 0}, {"key": "35280425", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18713267743132178, "ground_truth": 0}, {"key": "35280425", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.24364245647476418, "ground_truth": 0}, {"key": "35280425", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782567987056296, "ground_truth": 0}, {"key": "35280425", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17328821013485826, "ground_truth": 0}, {"key": "16365170", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09807932737203966, "ground_truth": 0}, {"key": "16365170", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15610490622355902, "ground_truth": 0}, {"key": "16365170", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10374862519371014, "ground_truth": 0}, {"key": "16365170", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03934250390792611, "ground_truth": 0}, {"key": "16365170", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06705628872171583, "ground_truth": 0}, {"key": "24388238", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4629586061444774, "ground_truth": 0}, {"key": "24388238", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8940517187032843, "ground_truth": 0}, {"key": "24388238", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8479677593442301, "ground_truth": 0}, {"key": "24388238", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504744328457, "ground_truth": 0}, {"key": "24388238", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9872772917868761, "ground_truth": 0}, {"key": "35024827", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05165378230549387, "ground_truth": 0}, {"key": "35024827", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06681232313784012, "ground_truth": 0}, {"key": "35024827", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09235979551017721, "ground_truth": 0}, {"key": "35024827", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.016340127711716716, "ground_truth": 0}, {"key": "35024827", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0897732858741709, "ground_truth": 0}, {"key": "38624944", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07751765937185302, "ground_truth": 0}, {"key": "38624944", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.040540737072461606, "ground_truth": 0}, {"key": "38624944", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04468087078712923, "ground_truth": 0}, {"key": "38624944", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.028220986395444125, "ground_truth": 0}, {"key": "38624944", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.029760093298481508, "ground_truth": 0}, {"key": "34719830", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19193280145811112, "ground_truth": 0}, {"key": "34719830", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1955940793171462, "ground_truth": 0}, {"key": "34719830", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20817892983229555, "ground_truth": 0}, {"key": "34719830", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3073580095381165, "ground_truth": 0}, {"key": "34719830", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510839396188327, "ground_truth": 0}, {"key": "38995225", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3684056968157022, "ground_truth": 0}, {"key": "38995225", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4244119964754139, "ground_truth": 0}, {"key": "38995225", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6020615778434403, "ground_truth": 0}, {"key": "38995225", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15102780234877186, "ground_truth": 0}, {"key": "38995225", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2658804740496002, "ground_truth": 0}, {"key": "34242311", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15713685624962223, "ground_truth": 0}, {"key": "34242311", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.012527934320559514, "ground_truth": 0}, {"key": "34242311", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.027901379328306986, "ground_truth": 0}, {"key": "34242311", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0577053133414265, "ground_truth": 0}, {"key": "34242311", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.021287351311621194, "ground_truth": 0}, {"key": "39253748", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5851011729789098, "ground_truth": 0}, {"key": "39253748", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.33111974595183175, "ground_truth": 0}, {"key": "39253748", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6926419878685809, "ground_truth": 0}, {"key": "39253748", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879311862016101, "ground_truth": 0}, {"key": "39253748", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076629413161718, "ground_truth": 0}, {"key": "37131104", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7859664303475163, "ground_truth": 0}, {"key": "37131104", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6252093027956489, "ground_truth": 0}, {"key": "37131104", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8683809576695051, "ground_truth": 0}, {"key": "37131104", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7082125914899535, "ground_truth": 0}, {"key": "37131104", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577680980748256, "ground_truth": 0}, {"key": "38490554", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03904829133572273, "ground_truth": 0}, {"key": "38490554", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.021287349928348104, "ground_truth": 0}, {"key": "38490554", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04054073790243598, "ground_truth": 0}, {"key": "38490554", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03102617807890965, "ground_truth": 0}, {"key": "38490554", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.008511302822032198, "ground_truth": 0}, {"key": "29009500", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20434190447058262, "ground_truth": 0}, {"key": "29009500", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.27669052848645226, "ground_truth": 0}, {"key": "29009500", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22000710748497757, "ground_truth": 0}, {"key": "29009500", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17667160561101994, "ground_truth": 0}, {"key": "29009500", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15102780525830303, "ground_truth": 0}, {"key": "36703057", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11920292064944835, "ground_truth": 0}, {"key": "36703057", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20307461824638423, "ground_truth": 0}, {"key": "36703057", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19436781928633717, "ground_truth": 0}, {"key": "36703057", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864513172442746, "ground_truth": 0}, {"key": "36703057", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074558490279646, "ground_truth": 0}, {"key": "34876987", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1943678226435525, "ground_truth": 0}, {"key": "34876987", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06656918896469642, "ground_truth": 0}, {"key": "34876987", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09602549171182871, "ground_truth": 0}, {"key": "34876987", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03161876757170898, "ground_truth": 0}, {"key": "34876987", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04535257938164317, "ground_truth": 0}, {"key": "36209258", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09670579038701776, "ground_truth": 0}, {"key": "36209258", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03817827608517641, "ground_truth": 0}, {"key": "36209258", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.028114056390203947, "ground_truth": 0}, {"key": "36209258", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05281402367551202, "ground_truth": 0}, {"key": "36209258", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0761324758941954, "ground_truth": 0}, {"key": "36854437", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15304216052274433, "ground_truth": 0}, {"key": "36854437", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18713269673782781, "ground_truth": 0}, {"key": "36854437", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07477004632939971, "ground_truth": 0}, {"key": "36854437", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07807816313789652, "ground_truth": 0}, {"key": "36854437", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21733752333997666, "ground_truth": 0}, {"key": "38047723", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23510838523583763, "ground_truth": 0}, {"key": "38047723", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20689405407882538, "ground_truth": 0}, {"key": "38047723", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.24798742786952363, "ground_truth": 0}, {"key": "38047723", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310345914705, "ground_truth": 0}, {"key": "38047723", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19682619822804723, "ground_truth": 0}, {"key": "34287816", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014117893103565092, "ground_truth": 0}, {"key": "34287816", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.004468384501529864, "ground_truth": 0}, {"key": "34287816", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05500528403152131, "ground_truth": 0}, {"key": "34287816", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.023962026634539727, "ground_truth": 0}, {"key": "34287816", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.022201227245947208, "ground_truth": 0}, {"key": "33235855", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07892588157092614, "ground_truth": 0}, {"key": "33235855", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06928941316448783, "ground_truth": 0}, {"key": "33235855", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1895211004433038, "ground_truth": 0}, {"key": "33235855", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0869416575082481, "ground_truth": 0}, {"key": "33235855", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421301326453746, "ground_truth": 0}, {"key": "34381016", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24508501086670542, "ground_truth": 0}, {"key": "34381016", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.25386101217673124, "ground_truth": 0}, {"key": "34381016", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08694166379614596, "ground_truth": 0}, {"key": "34381016", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11436852583169328, "ground_truth": 0}, {"key": "34381016", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08181271607105632, "ground_truth": 0}, {"key": "28064995", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17553806891790685, "ground_truth": 0}, {"key": "28064995", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12592277266428312, "ground_truth": 0}, {"key": "28064995", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20561504016607876, "ground_truth": 0}, {"key": "28064995", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2689414351013762, "ground_truth": 0}, {"key": "28064995", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17667161514694812, "ground_truth": 0}, {"key": "37576197", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014063626418557377, "ground_truth": 0}, {"key": "37576197", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06903793051460272, "ground_truth": 0}, {"key": "37576197", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04569203020116439, "ground_truth": 0}, {"key": "37576197", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07807815760608942, "ground_truth": 0}, {"key": "37576197", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08632347720983735, "ground_truth": 0}, {"key": "34454741", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.026556573127698505, "ground_truth": 0}, {"key": "34454741", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.008644178272347694, "ground_truth": 0}, {"key": "34454741", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04958902583508957, "ground_truth": 0}, {"key": "34454741", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07211219972243176, "ground_truth": 0}, {"key": "34454741", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.016340128252243544, "ground_truth": 0}, {"key": "34766970", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4130035582571486, "ground_truth": 0}, {"key": "34766970", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.39233684148473463, "ground_truth": 0}, {"key": "34766970", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.40544872768745444, "ground_truth": 0}, {"key": "34766970", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20434189039291348, "ground_truth": 0}, {"key": "34766970", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10521053054740871, "ground_truth": 0}, {"key": "35574186", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.006097561750195438, "ground_truth": 0}, {"key": "35574186", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.008412977369357307, "ground_truth": 0}, {"key": "35574186", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01812472135182016, "ground_truth": 0}, {"key": "35574186", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.00828362660032301, "ground_truth": 0}, {"key": "35574186", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01120121355072952, "ground_truth": 0}, {"key": "35486470", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.031979558881594546, "ground_truth": 0}, {"key": "35486470", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.007403014064864907, "ground_truth": 0}, {"key": "35486470", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16238002812791438, "ground_truth": 0}, {"key": "35486470", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05399884061756407, "ground_truth": 0}, {"key": "35486470", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.023962024156216906, "ground_truth": 0}, {"key": "40977702", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.013532148705823373, "ground_truth": 0}, {"key": "40977702", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17217184707870398, "ground_truth": 0}, {"key": "40977702", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.017712298019254172, "ground_truth": 0}, {"key": "40977702", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.030908959979732337, "ground_truth": 0}, {"key": "40977702", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0253713112849318, "ground_truth": 0}, {"key": "35336618", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05419873451298277, "ground_truth": 0}, {"key": "35336618", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0073173977086597505, "ground_truth": 0}, {"key": "35336618", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.008348053878590288, "ground_truth": 0}, {"key": "35336618", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0195686760783393, "ground_truth": 0}, {"key": "35336618", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06954174247455802, "ground_truth": 0}, {"key": "33024679", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12592276384557763, "ground_truth": 0}, {"key": "33024679", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07585817852201339, "ground_truth": 0}, {"key": "33024679", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.36477757492611596, "ground_truth": 0}, {"key": "33024679", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07263670377282988, "ground_truth": 0}, {"key": "33024679", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2658804778999549, "ground_truth": 0}, {"key": "37451334", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2674081681590685, "ground_truth": 0}, {"key": "37451334", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09203286377366744, "ground_truth": 0}, {"key": "37451334", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.35398630630782424, "ground_truth": 0}, {"key": "37451334", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2160115381026664, "ground_truth": 0}, {"key": "37451334", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643868647177, "ground_truth": 0}, {"key": "33354824", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2991051870574212, "ground_truth": 0}, {"key": "33354824", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03649376587987372, "ground_truth": 0}, {"key": "33354824", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.30074559159571423, "ground_truth": 0}, {"key": "33354824", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08035746859963813, "ground_truth": 0}, {"key": "33354824", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3191213797924337, "ground_truth": 0}, {"key": "34688538", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07558478806882762, "ground_truth": 0}, {"key": "34688538", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06804042037354197, "ground_truth": 0}, {"key": "34688538", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.023962024839298338, "ground_truth": 0}, {"key": "34688538", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08819004459908542, "ground_truth": 0}, {"key": "34688538", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.036493766687384535, "ground_truth": 0}, {"key": "33646276", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.36840571024105156, "ground_truth": 0}, {"key": "33646276", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2974699634643544, "ground_truth": 0}, {"key": "33646276", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22270012996223396, "ground_truth": 0}, {"key": "33646276", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19744446363667642, "ground_truth": 0}, {"key": "33646276", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06512754860204273, "ground_truth": 0}, {"key": "40322608", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03210070826436604, "ground_truth": 0}, {"key": "40322608", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.042882240671149, "ground_truth": 0}, {"key": "40322608", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07864238411166681, "ground_truth": 0}, {"key": "40322608", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.013020489952886708, "ground_truth": 0}, {"key": "40322608", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03474962811065686, "ground_truth": 0}, {"key": "39565762", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04288224312077228, "ground_truth": 0}, {"key": "39565762", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04831607417675872, "ground_truth": 0}, {"key": "39565762", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0216153322185863, "ground_truth": 0}, {"key": "39565762", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0556176120437428, "ground_truth": 0}, {"key": "39565762", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06754669590161161, "ground_truth": 0}, {"key": "30534259", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15817435151762432, "ground_truth": 0}, {"key": "30534259", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03541072730349973, "ground_truth": 0}, {"key": "30534259", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11596071070656383, "ground_truth": 0}, {"key": "30534259", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10669059770891381, "ground_truth": 0}, {"key": "30534259", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08210663228679603, "ground_truth": 0}, {"key": "39644242", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03448852431716632, "ground_truth": 0}, {"key": "39644242", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05261895539740935, "ground_truth": 0}, {"key": "39644242", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04115288694336717, "ground_truth": 0}, {"key": "39644242", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09807932222321811, "ground_truth": 0}, {"key": "39644242", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08725224452493018, "ground_truth": 0}, {"key": "19853740", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14903530334890003, "ground_truth": 0}, {"key": "19853740", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15507846257669586, "ground_truth": 0}, {"key": "19853740", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18359362580177294, "ground_truth": 0}, {"key": "19853740", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223188807904438, "ground_truth": 0}, {"key": "19853740", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10447732062550452, "ground_truth": 0}, {"key": "33023078", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.31912138273960583, "ground_truth": 0}, {"key": "33023078", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.040237942542110744, "ground_truth": 0}, {"key": "33023078", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1561048985478844, "ground_truth": 0}, {"key": "33023078", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0894546015121337, "ground_truth": 0}, {"key": "33023078", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13986565103294707, "ground_truth": 0}, {"key": "38329806", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07211219937094764, "ground_truth": 0}, {"key": "38329806", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14033624719339913, "ground_truth": 0}, {"key": "38329806", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13477592097599952, "ground_truth": 0}, {"key": "38329806", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09073549283750088, "ground_truth": 0}, {"key": "38329806", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1550784703888337, "ground_truth": 0}, {"key": "38761942", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8577681137289228, "ground_truth": 0}, {"key": "38761942", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.844921527999552, "ground_truth": 0}, {"key": "38761942", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8333246026928284, "ground_truth": 0}, {"key": "38761942", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300522706499, "ground_truth": 0}, {"key": "38761942", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106282922466778, "ground_truth": 0}, {"key": "33773576", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.013070784312348547, "ground_truth": 0}, {"key": "33773576", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10374862995992726, "ground_truth": 0}, {"key": "33773576", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.013902059174537441, "ground_truth": 0}, {"key": "33773576", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009596455030070157, "ground_truth": 0}, {"key": "33773576", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03435868926936602, "ground_truth": 0}, {"key": "37642631", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14511536359712254, "ground_truth": 0}, {"key": "37642631", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05921025657931878, "ground_truth": 0}, {"key": "37642631", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13028542373418586, "ground_truth": 0}, {"key": "37642631", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08269733787007559, "ground_truth": 0}, {"key": "37642631", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09877259005686198, "ground_truth": 0}, {"key": "36609836", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14414886034404467, "ground_truth": 0}, {"key": "36609836", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2465333364620978, "ground_truth": 0}, {"key": "36609836", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16559312092455306, "ground_truth": 0}, {"key": "36609836", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06608537897312153, "ground_truth": 0}, {"key": "36609836", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11516223536591041, "ground_truth": 0}, {"key": "41035610", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22270014453559125, "ground_truth": 0}, {"key": "41035610", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05340333409561328, "ground_truth": 0}, {"key": "41035610", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05707140079041982, "ground_truth": 0}, {"key": "41035610", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15405756123672357, "ground_truth": 0}, {"key": "41035610", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05791808702353796, "ground_truth": 0}, {"key": "37592684", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.012870748970840305, "ground_truth": 0}, {"key": "37592684", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10087861413492939, "ground_truth": 0}, {"key": "37592684", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18713269032790106, "ground_truth": 0}, {"key": "37592684", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03283695503252528, "ground_truth": 0}, {"key": "37592684", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10230469902836235, "ground_truth": 0}, {"key": "38951040", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.055005281729582925, "ground_truth": 0}, {"key": "38951040", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06164962317230038, "ground_truth": 0}, {"key": "38951040", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10669059957451109, "ground_truth": 0}, {"key": "38951040", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07081619732921113, "ground_truth": 0}, {"key": "38951040", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01737566430098467, "ground_truth": 0}, {"key": "40774469", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0409990289445502, "ground_truth": 0}, {"key": "40774469", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.017309097033509697, "ground_truth": 0}, {"key": "40774469", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08787643653305215, "ground_truth": 0}, {"key": "40774469", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07835981154567545, "ground_truth": 0}, {"key": "40774469", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.040087356860961716, "ground_truth": 0}, {"key": "40876288", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0697949187493539, "ground_truth": 0}, {"key": "40876288", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.014009567338542384, "ground_truth": 0}, {"key": "40876288", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03371653777034103, "ground_truth": 0}, {"key": "40876288", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.010288301227686727, "ground_truth": 0}, {"key": "40876288", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.009090382932656576, "ground_truth": 0}, {"key": "40340131", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15304215330767665, "ground_truth": 0}, {"key": "40340131", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03875619617196097, "ground_truth": 0}, {"key": "40340131", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1302854200274565, "ground_truth": 0}, {"key": "40340131", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03760863395265107, "ground_truth": 0}, {"key": "40340131", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1451153569364039, "ground_truth": 0}, {"key": "30121591", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10706345553080251, "ground_truth": 0}, {"key": "30121591", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05281402317582361, "ground_truth": 0}, {"key": "30121591", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.044847905187246885, "ground_truth": 0}, {"key": "30121591", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08819004230236455, "ground_truth": 0}, {"key": "30121591", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05070536239750211, "ground_truth": 0}, {"key": "35623366", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.055005284167999005, "ground_truth": 0}, {"key": "35623366", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.006145092118627187, "ground_truth": 0}, {"key": "35623366", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04084571811623365, "ground_truth": 0}, {"key": "35623366", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.026657741224722892, "ground_truth": 0}, {"key": "35623366", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13568953873309816, "ground_truth": 0}, {"key": "41014093", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20434189614339124, "ground_truth": 0}, {"key": "41014093", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1233656232443246, "ground_truth": 0}, {"key": "41014093", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3757064742571285, "ground_truth": 0}, {"key": "41014093", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2925953139925934, "ground_truth": 0}, {"key": "41014093", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4687906187320586, "ground_truth": 0}, {"key": "11387984", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05942821660418332, "ground_truth": 0}, {"key": "11387984", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11676401395245298, "ground_truth": 0}, {"key": "11387984", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.26740816234989634, "ground_truth": 0}, {"key": "11387984", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04849600209180946, "ground_truth": 0}, {"key": "11387984", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08210662787770705, "ground_truth": 0}, {"key": "39508312", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03622005843923239, "ground_truth": 0}, {"key": "39508312", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11516222912221015, "ground_truth": 0}, {"key": "39508312", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06954174628873241, "ground_truth": 0}, {"key": "39508312", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14414885279584502, "ground_truth": 0}, {"key": "39508312", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594720842824378, "ground_truth": 0}, {"key": "35815369", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1895210942167447, "ground_truth": 0}, {"key": "35815369", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15405756674375426, "ground_truth": 0}, {"key": "35815369", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21206880168770306, "ground_truth": 0}, {"key": "35815369", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14804718813547213, "ground_truth": 0}, {"key": "35815369", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08632348090178464, "ground_truth": 0}, {"key": "35802823", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.038466192176975694, "ground_truth": 0}, {"key": "35802823", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03875619671802667, "ground_truth": 0}, {"key": "35802823", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.026556572134104027, "ground_truth": 0}, {"key": "35802823", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.027066177104600176, "ground_truth": 0}, {"key": "35802823", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.041773878597327244, "ground_truth": 0}, {"key": "38499968", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.31573599611079195, "ground_truth": 0}, {"key": "38499968", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10669059109555318, "ground_truth": 0}, {"key": "38499968", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09670579251908015, "ground_truth": 0}, {"key": "38499968", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181321890981596, "ground_truth": 0}, {"key": "38499968", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22000709669665336, "ground_truth": 0}, {"key": "36926726", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.024053553409641437, "ground_truth": 0}, {"key": "36926726", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0403890678398425, "ground_truth": 0}, {"key": "36926726", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.040389068883487686, "ground_truth": 0}, {"key": "36926726", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0860158753719635, "ground_truth": 0}, {"key": "36926726", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0758581834301868, "ground_truth": 0}, {"key": "40903712", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22953521700295346, "ground_truth": 0}, {"key": "40903712", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2674081581279257, "ground_truth": 0}, {"key": "40903712", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15203224627616482, "ground_truth": 0}, {"key": "40903712", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09670578668478072, "ground_truth": 0}, {"key": "40903712", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12085323619321485, "ground_truth": 0}, {"key": "19614862", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.018264278238193574, "ground_truth": 0}, {"key": "19614862", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05582314087499044, "ground_truth": 0}, {"key": "19614862", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03622005698907047, "ground_truth": 0}, {"key": "19614862", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06954174493582924, "ground_truth": 0}, {"key": "19614862", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0680404218580631, "ground_truth": 0}, {"key": "38861704", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.022977369080483492, "ground_truth": 0}, {"key": "38861704", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.011869121075568142, "ground_truth": 0}, {"key": "38861704", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010328153156973304, "ground_truth": 0}, {"key": "38861704", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009196553115909226, "ground_truth": 0}, {"key": "38861704", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.015306355059071967, "ground_truth": 0}, {"key": "34349607", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.29583987501746106, "ground_truth": 0}, {"key": "34349607", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.032836956409050364, "ground_truth": 0}, {"key": "34349607", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07369627153147078, "ground_truth": 0}, {"key": "34349607", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05707140328528401, "ground_truth": 0}, {"key": "34349607", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07751765762707472, "ground_truth": 0}, {"key": "20773800", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.003621685389848245, "ground_truth": 0}, {"key": "20773800", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0036928528505072544, "ground_truth": 0}, {"key": "20773800", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.001889538788103679, "ground_truth": 0}, {"key": "20773800", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0034030054898530125, "ground_truth": 0}, {"key": "20773800", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.005888159207425215, "ground_truth": 0}, {"key": "35545608", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03422932283493625, "ground_truth": 0}, {"key": "35545608", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03258974292583638, "ground_truth": 0}, {"key": "35545608", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.016466175027353414, "ground_truth": 0}, {"key": "35545608", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.011463797711312694, "ground_truth": 0}, {"key": "35545608", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.008061992004670372, "ground_truth": 0}, {"key": "37258984", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13206614613387635, "ground_truth": 0}, {"key": "37258984", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16451645149864158, "ground_truth": 0}, {"key": "37258984", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08570927907791362, "ground_truth": 0}, {"key": "37258984", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08269734270546326, "ground_truth": 0}, {"key": "37258984", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07159119992853599, "ground_truth": 0}, {"key": "37274562", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2893716918713314, "ground_truth": 0}, {"key": "37274562", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18952108229005094, "ground_truth": 0}, {"key": "37274562", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4263215990694147, "ground_truth": 0}, {"key": "37274562", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215176065423, "ground_truth": 0}, {"key": "37274562", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20434189253004414, "ground_truth": 0}, {"key": "40828068", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0587765619808089, "ground_truth": 0}, {"key": "40828068", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0453525803098242, "ground_truth": 0}, {"key": "40828068", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03622005784175528, "ground_truth": 0}, {"key": "40828068", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.023779982620875138, "ground_truth": 0}, {"key": "40828068", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06853749359847473, "ground_truth": 0}, {"key": "37807180", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.36296918142518475, "ground_truth": 0}, {"key": "37807180", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.535098406911129, "ground_truth": 0}, {"key": "37807180", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4960938266519825, "ground_truth": 0}, {"key": "37807180", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191214019255813, "ground_truth": 0}, {"key": "37807180", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6575384333860179, "ground_truth": 0}, {"key": "40748607", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.015845361536474457, "ground_truth": 0}, {"key": "40748607", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08151975481356712, "ground_truth": 0}, {"key": "40748607", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15002882709493812, "ground_truth": 0}, {"key": "40748607", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07159119915271368, "ground_truth": 0}, {"key": "40748607", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.009090383217214722, "ground_truth": 0}, {"key": "40123819", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12336561149448196, "ground_truth": 0}, {"key": "40123819", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06608537364482095, "ground_truth": 0}, {"key": "40123819", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0769608367676605, "ground_truth": 0}, {"key": "40123819", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08509904586785329, "ground_truth": 0}, {"key": "40123819", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12852513619326283, "ground_truth": 0}, {"key": "38453867", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4590761257849884, "ground_truth": 0}, {"key": "38453867", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0736962728532533, "ground_truth": 0}, {"key": "38453867", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05261895323589339, "ground_truth": 0}, {"key": "38453867", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689405661662674, "ground_truth": 0}, {"key": "38453867", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09203285600400274, "ground_truth": 0}, {"key": "38944856", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2337063500974562, "ground_truth": 0}, {"key": "38944856", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3665897440721958, "ground_truth": 0}, {"key": "38944856", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14903530266207218, "ground_truth": 0}, {"key": "38944856", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.29421497134586416, "ground_truth": 0}, {"key": "38944856", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0857092779070498, "ground_truth": 0}, {"key": "35778898", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1316190381837356, "ground_truth": 0}, {"key": "35778898", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10631887038023508, "ground_truth": 0}, {"key": "35778898", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12168575472800609, "ground_truth": 0}, {"key": "35778898", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1441488461764492, "ground_truth": 0}, {"key": "35778898", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13296424690652106, "ground_truth": 0}, {"key": "32530125", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.059866421658305566, "ground_truth": 0}, {"key": "32530125", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09009299602122343, "ground_truth": 0}, {"key": "32530125", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07477004487004063, "ground_truth": 0}, {"key": "32530125", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07751765654970509, "ground_truth": 0}, {"key": "32530125", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04208772838202915, "ground_truth": 0}, {"key": "35010363", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05419873214836561, "ground_truth": 0}, {"key": "35010363", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.006217077951426027, "ground_truth": 0}, {"key": "35010363", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010489091718988463, "ground_truth": 0}, {"key": "35010363", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.022715754792281707, "ground_truth": 0}, {"key": "35010363", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03514484609363736, "ground_truth": 0}, {"key": "27514800", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18952110307976267, "ground_truth": 0}, {"key": "27514800", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04518375341577061, "ground_truth": 0}, {"key": "27514800", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06681233263367825, "ground_truth": 0}, {"key": "27514800", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0600866473814907, "ground_truth": 0}, {"key": "27514800", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08756384216089592, "ground_truth": 0}, {"key": "25725840", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.023153410658066156, "ground_truth": 0}, {"key": "25725840", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.006488269875931045, "ground_truth": 0}, {"key": "25725840", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.020645931590437185, "ground_truth": 0}, {"key": "25725840", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.006850479921744999, "ground_truth": 0}, {"key": "25725840", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.015130728237875311, "ground_truth": 0}, {"key": "38327225", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11838510065417317, "ground_truth": 0}, {"key": "38327225", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07477005031339465, "ground_truth": 0}, {"key": "38327225", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11676400613282066, "ground_truth": 0}, {"key": "38327225", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04707418016937749, "ground_truth": 0}, {"key": "38327225", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07316471844964112, "ground_truth": 0}, {"key": "11991724", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2553436362612458, "ground_truth": 0}, {"key": "11991724", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19193278932952829, "ground_truth": 0}, {"key": "11991724", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5195213222122602, "ground_truth": 0}, {"key": "11991724", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3830641744084453, "ground_truth": 0}, {"key": "11991724", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643727397085, "ground_truth": 0}, {"key": "32217545", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02120612019571228, "ground_truth": 0}, {"key": "32217545", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04054073580688793, "ground_truth": 0}, {"key": "32217545", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06705628804989748, "ground_truth": 0}, {"key": "32217545", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.025957357787799815, "ground_truth": 0}, {"key": "32217545", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05921024901369739, "ground_truth": 0}, {"key": "12731847", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.018978037053158453, "ground_truth": 0}, {"key": "12731847", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.019493870766548432, "ground_truth": 0}, {"key": "12731847", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.017576883547344328, "ground_truth": 0}, {"key": "12731847", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.013848610379662655, "ground_truth": 0}, {"key": "12731847", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09009299392832064, "ground_truth": 0}, {"key": "36827234", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10818895937971543, "ground_truth": 0}, {"key": "36827234", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08210663393800118, "ground_truth": 0}, {"key": "36827234", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16026602601067744, "ground_truth": 0}, {"key": "36827234", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09739039835556541, "ground_truth": 0}, {"key": "36827234", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11838509760799575, "ground_truth": 0}, {"key": "29111539", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07807815968687319, "ground_truth": 0}, {"key": "29111539", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.33285233978199913, "ground_truth": 0}, {"key": "29111539", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08632348062939627, "ground_truth": 0}, {"key": "29111539", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08269734097888493, "ground_truth": 0}, {"key": "29111539", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09877259299331712, "ground_truth": 0}, {"key": "37763052", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0973903969693274, "ground_truth": 0}, {"key": "37763052", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03371654047404956, "ground_truth": 0}, {"key": "37763052", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.30239109353066584, "ground_truth": 0}, {"key": "37763052", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0857092745034484, "ground_truth": 0}, {"key": "37763052", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0497734434246921, "ground_truth": 0}, {"key": "30682335", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027901377071897986, "ground_truth": 0}, {"key": "30682335", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02186455674875419, "ground_truth": 0}, {"key": "30682335", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.017644464815601082, "ground_truth": 0}, {"key": "30682335", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0809367136353907, "ground_truth": 0}, {"key": "30682335", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.026455776339803526, "ground_truth": 0}, {"key": "12261276", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5945512665731415, "ground_truth": 0}, {"key": "12261276", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2735744005545153, "ground_truth": 0}, {"key": "12261276", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.43590152974490837, "ground_truth": 0}, {"key": "12261276", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.41869692609463877, "ground_truth": 0}, {"key": "12261276", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241612761506, "ground_truth": 0}, {"key": "36912979", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.050705363713053446, "ground_truth": 0}, {"key": "36912979", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.058131591532425635, "ground_truth": 0}, {"key": "36912979", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07921032289719115, "ground_truth": 0}, {"key": "36912979", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.048316073765355926, "ground_truth": 0}, {"key": "36912979", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08006926609464769, "ground_truth": 0}, {"key": "30205259", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03622005937956258, "ground_truth": 0}, {"key": "30205259", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02169809910117788, "ground_truth": 0}, {"key": "30205259", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025858776130430163, "ground_truth": 0}, {"key": "30205259", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.013171950338445636, "ground_truth": 0}, {"key": "30205259", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.011961098591112579, "ground_truth": 0}, {"key": "39458032", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15817435492048493, "ground_truth": 0}, {"key": "39458032", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11162799910527467, "ground_truth": 0}, {"key": "39458032", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04958902487096998, "ground_truth": 0}, {"key": "39458032", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10158944796050486, "ground_truth": 0}, {"key": "39458032", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06828853986703581, "ground_truth": 0}, {"key": "35116452", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.015365341807010574, "ground_truth": 0}, {"key": "35116452", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0343586886631263, "ground_truth": 0}, {"key": "35116452", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03435868934653636, "ground_truth": 0}, {"key": "35116452", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01191502259378255, "ground_truth": 0}, {"key": "35116452", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.025565212345450193, "ground_truth": 0}, {"key": "40107476", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04742587088335915, "ground_truth": 0}, {"key": "40107476", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08064662085808263, "ground_truth": 0}, {"key": "40107476", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07211219781595725, "ground_truth": 0}, {"key": "40107476", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11397345939104862, "ground_truth": 0}, {"key": "40107476", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04484790356157788, "ground_truth": 0}, {"key": "39501049", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18242552686214766, "ground_truth": 0}, {"key": "39501049", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06301947247154303, "ground_truth": 0}, {"key": "39501049", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.060751905956339294, "ground_truth": 0}, {"key": "39501049", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06608537667746131, "ground_truth": 0}, {"key": "39501049", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13846178938693635, "ground_truth": 0}, {"key": "39642178", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.25683200344852075, "ground_truth": 0}, {"key": "39642178", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.055412790596856755, "ground_truth": 0}, {"key": "39642178", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08449275360795566, "ground_truth": 0}, {"key": "39642178", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08945459476727037, "ground_truth": 0}, {"key": "39642178", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10017222168297361, "ground_truth": 0}, {"key": "38024796", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1613202410437819, "ground_truth": 0}, {"key": "38024796", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.161320243224021, "ground_truth": 0}, {"key": "38024796", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09401018401031354, "ground_truth": 0}, {"key": "38024796", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12721827525112978, "ground_truth": 0}, {"key": "38024796", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421301123658528, "ground_truth": 0}, {"key": "36652079", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05146276253163729, "ground_truth": 0}, {"key": "36652079", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04603389961727645, "ground_truth": 0}, {"key": "36652079", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.027169232145658636, "ground_truth": 0}, {"key": "36652079", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05340333324530165, "ground_truth": 0}, {"key": "36652079", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03358950790702675, "ground_truth": 0}, {"key": "32193402", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04569203340216022, "ground_truth": 0}, {"key": "32193402", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.010091315374113126, "ground_truth": 0}, {"key": "32193402", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06512754934463216, "ground_truth": 0}, {"key": "32193402", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10123348331322339, "ground_truth": 0}, {"key": "32193402", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.047249713235670614, "ground_truth": 0}, {"key": "32589706", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09235979068717856, "ground_truth": 0}, {"key": "32589706", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07640768653336069, "ground_truth": 0}, {"key": "32589706", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.057705314109637786, "ground_truth": 0}, {"key": "32589706", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06489012166891807, "ground_truth": 0}, {"key": "32589706", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10017222374814806, "ground_truth": 0}, {"key": "38590589", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.010408314505732678, "ground_truth": 0}, {"key": "38590589", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.009268012962198674, "ground_truth": 0}, {"key": "38590589", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03817827741980026, "ground_truth": 0}, {"key": "38590589", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.020567095737883862, "ground_truth": 0}, {"key": "38590589", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.011201213995419668, "ground_truth": 0}, {"key": "37045414", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7201715422667807, "ground_truth": 0}, {"key": "37045414", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5039061759222576, "ground_truth": 0}, {"key": "37045414", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5698526545865845, "ground_truth": 0}, {"key": "37045414", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759729630054, "ground_truth": 0}, {"key": "37045414", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881145301853, "ground_truth": 0}, {"key": "33310095", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09704755833539967, "ground_truth": 0}, {"key": "33310095", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07211219479798123, "ground_truth": 0}, {"key": "33310095", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.026759283497047304, "ground_truth": 0}, {"key": "33310095", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08449275296422805, "ground_truth": 0}, {"key": "33310095", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.044348580890848754, "ground_truth": 0}, {"key": "37934604", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13117322124659092, "ground_truth": 0}, {"key": "37934604", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12252321663883609, "ground_truth": 0}, {"key": "37934604", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12678516775173546, "ground_truth": 0}, {"key": "37934604", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08694166209424994, "ground_truth": 0}, {"key": "37934604", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11357958639462681, "ground_truth": 0}, {"key": "39012181", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7853086009891915, "ground_truth": 0}, {"key": "39012181", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6557770145903613, "ground_truth": 0}, {"key": "39012181", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5774953574045162, "ground_truth": 0}, {"key": "39012181", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253729900017, "ground_truth": 0}, {"key": "39012181", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6575384353312113, "ground_truth": 0}, {"key": "40221674", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15102780785088812, "ground_truth": 0}, {"key": "40221674", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20055769076277333, "ground_truth": 0}, {"key": "40221674", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13386748263120854, "ground_truth": 0}, {"key": "40221674", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10818895633393492, "ground_truth": 0}, {"key": "40221674", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3208213079883021, "ground_truth": 0}, {"key": "36884862", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04288223904675891, "ground_truth": 0}, {"key": "36884862", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03410042806073203, "ground_truth": 0}, {"key": "36884862", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06928941582051919, "ground_truth": 0}, {"key": "36884862", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.045862666312982504, "ground_truth": 0}, {"key": "36884862", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04552200805971923, "ground_truth": 0}, {"key": "39054429", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09467770480827112, "ground_truth": 0}, {"key": "39054429", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09534945860734961, "ground_truth": 0}, {"key": "39054429", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11596071240014494, "ground_truth": 0}, {"key": "39054429", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09401018339220799, "ground_truth": 0}, {"key": "39054429", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16344543298007877, "ground_truth": 0}, {"key": "36753964", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2658804626948749, "ground_truth": 0}, {"key": "36753964", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05707139955880311, "ground_truth": 0}, {"key": "36753964", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5428632601591786, "ground_truth": 0}, {"key": "36753964", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16026604164978442, "ground_truth": 0}, {"key": "36753964", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2958398753548272, "ground_truth": 0}, {"key": "37612459", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.42441198560004545, "ground_truth": 0}, {"key": "37612459", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.30404168741328574, "ground_truth": 0}, {"key": "37612459", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6076631564951404, "ground_truth": 0}, {"key": "37612459", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.35756752164266664, "ground_truth": 0}, {"key": "37612459", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.253861014483533, "ground_truth": 0}, {"key": "36805789", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06187598553918275, "ground_truth": 0}, {"key": "36805789", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1592174051775304, "ground_truth": 0}, {"key": "36805789", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12294379621217948, "ground_truth": 0}, {"key": "36805789", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08509904214767519, "ground_truth": 0}, {"key": "36805789", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24653334224840662, "ground_truth": 0}, {"key": "12757394", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11124121555290403, "ground_truth": 0}, {"key": "12757394", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06465349214173643, "ground_truth": 0}, {"key": "12757394", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1127953994341337, "ground_truth": 0}, {"key": "12757394", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11596072145649812, "ground_truth": 0}, {"key": "12757394", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07585817951779206, "ground_truth": 0}, {"key": "32192542", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3720487941205983, "ground_truth": 0}, {"key": "32192542", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2281565022703808, "ground_truth": 0}, {"key": "32192542", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3106943890000967, "ground_truth": 0}, {"key": "32192542", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3629692009101845, "ground_truth": 0}, {"key": "32192542", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014734322141485, "ground_truth": 0}, {"key": "34856060", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2925953136032988, "ground_truth": 0}, {"key": "34856060", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.24364244377962765, "ground_truth": 0}, {"key": "34856060", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.31069439495096934, "ground_truth": 0}, {"key": "34856060", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689405034154157, "ground_truth": 0}, {"key": "34856060", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15974102110560628, "ground_truth": 0}, {"key": "36083416", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2704802192721081, "ground_truth": 0}, {"key": "36083416", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2877678244794119, "ground_truth": 0}, {"key": "36083416", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21337717626237826, "ground_truth": 0}, {"key": "36083416", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2766905140060904, "ground_truth": 0}, {"key": "36083416", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.31573596226549816, "ground_truth": 0}, {"key": "33839050", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1063188755633446, "ground_truth": 0}, {"key": "33839050", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.022371458482444952, "ground_truth": 0}, {"key": "33839050", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.017917344681123906, "ground_truth": 0}, {"key": "33839050", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06560483488049434, "ground_truth": 0}, {"key": "33839050", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.027376489123530846, "ground_truth": 0}, {"key": "18464690", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.022286185745529433, "ground_truth": 0}, {"key": "18464690", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.015247590355875997, "ground_truth": 0}, {"key": "18464690", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.013171950829291451, "ground_truth": 0}, {"key": "18464690", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.011419614847127304, "ground_truth": 0}, {"key": "18464690", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.004681822916496374, "ground_truth": 0}, {"key": "39212665", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16995623188492973, "ground_truth": 0}, {"key": "39212665", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20307463141564044, "ground_truth": 0}, {"key": "39212665", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22541661216893194, "ground_truth": 0}, {"key": "39212665", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15002882438579693, "ground_truth": 0}, {"key": "39212665", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12765262139794825, "ground_truth": 0}, {"key": "40094011", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.021044565998141515, "ground_truth": 0}, {"key": "40094011", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01228859697891073, "ground_truth": 0}, {"key": "40094011", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.043365800417610796, "ground_truth": 0}, {"key": "40094011", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.024987794989177067, "ground_truth": 0}, {"key": "40094011", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02017731819173069, "ground_truth": 0}, {"key": "36036272", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5136684552152919, "ground_truth": 0}, {"key": "36036272", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.44167303291302634, "ground_truth": 0}, {"key": "36036272", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2465333502491696, "ground_truth": 0}, {"key": "36036272", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640184084072, "ground_truth": 0}, {"key": "36036272", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964270023883, "ground_truth": 0}, {"key": "30681904", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02048855498500138, "ground_truth": 0}, {"key": "30681904", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.017986210652896583, "ground_truth": 0}, {"key": "30681904", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.017309096825158077, "ground_truth": 0}, {"key": "30681904", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02423763475373284, "ground_truth": 0}, {"key": "30681904", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.044680872929555214, "ground_truth": 0}, {"key": "27834240", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10087862301643968, "ground_truth": 0}, {"key": "27834240", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3942009476013786, "ground_truth": 0}, {"key": "27834240", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.38676342513814826, "ground_truth": 0}, {"key": "27834240", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.29583986268027884, "ground_truth": 0}, {"key": "27834240", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.31912139634008785, "ground_truth": 0}, {"key": "35025075", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17441027959415417, "ground_truth": 0}, {"key": "35025075", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20817893451681568, "ground_truth": 0}, {"key": "35025075", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18713267728673633, "ground_truth": 0}, {"key": "35025075", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2227001464530909, "ground_truth": 0}, {"key": "35025075", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.045692036281692563, "ground_truth": 0}, {"key": "33316985", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19930801337241136, "ground_truth": 0}, {"key": "33316985", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09670578899167065, "ground_truth": 0}, {"key": "33316985", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0670562911036579, "ground_truth": 0}, {"key": "33316985", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11516223396941697, "ground_truth": 0}, {"key": "33316985", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.34687307564220177, "ground_truth": 0}, {"key": "17037056", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027376490157327342, "ground_truth": 0}, {"key": "17037056", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.103748630069992, "ground_truth": 0}, {"key": "17037056", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03185885655261268, "ground_truth": 0}, {"key": "17037056", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.036493767048401723, "ground_truth": 0}, {"key": "17037056", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.048136768918331255, "ground_truth": 0}, {"key": "34050457", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04552200662879777, "ground_truth": 0}, {"key": "34050457", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.023065225766194956, "ground_truth": 0}, {"key": "34050457", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03149938223456145, "ground_truth": 0}, {"key": "34050457", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06325052539478103, "ground_truth": 0}, {"key": "34050457", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09170696878596393, "ground_truth": 0}, {"key": "34713745", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07949570219508534, "ground_truth": 0}, {"key": "34713745", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08035746507359087, "ground_truth": 0}, {"key": "34713745", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0920328632392535, "ground_truth": 0}, {"key": "34713745", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12252321442971728, "ground_truth": 0}, {"key": "34713745", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07159120271361655, "ground_truth": 0}, {"key": "40856210", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10970577291439215, "ground_truth": 0}, {"key": "40856210", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10631887642477307, "ground_truth": 0}, {"key": "40856210", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07185126659160497, "ground_truth": 0}, {"key": "40856210", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1052105399156736, "ground_truth": 0}, {"key": "40856210", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13614831311507625, "ground_truth": 0}, {"key": "40848302", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04586266764856287, "ground_truth": 0}, {"key": "40848302", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.023241926811997323, "ground_truth": 0}, {"key": "40848302", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.022457055918876114, "ground_truth": 0}, {"key": "40848302", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04586266365255466, "ground_truth": 0}, {"key": "40848302", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0405407403798174, "ground_truth": 0}, {"key": "40636168", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19193278762493646, "ground_truth": 0}, {"key": "40636168", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5583269794397094, "ground_truth": 0}, {"key": "40636168", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.24944722360014063, "ground_truth": 0}, {"key": "40636168", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.27357438628261305, "ground_truth": 0}, {"key": "40636168", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13206615657478948, "ground_truth": 0}, {"key": "34423311", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1561048956616987, "ground_truth": 0}, {"key": "34423311", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04518375744014521, "ground_truth": 0}, {"key": "34423311", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23792989676753518, "ground_truth": 0}, {"key": "34423311", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1104711404240596, "ground_truth": 0}, {"key": "34423311", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1980641715889472, "ground_truth": 0}, {"key": "34833945", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03435868912013748, "ground_truth": 0}, {"key": "34833945", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02433019074857451, "ground_truth": 0}, {"key": "34833945", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.044514431021455414, "ground_truth": 0}, {"key": "34833945", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11476478222824935, "ground_truth": 0}, {"key": "34833945", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05986641344838447, "ground_truth": 0}, {"key": "21272328", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09301679910441618, "ground_truth": 0}, {"key": "21272328", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09105828354856692, "ground_truth": 0}, {"key": "21272328", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0963651080564553, "ground_truth": 0}, {"key": "21272328", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12336562662241188, "ground_truth": 0}, {"key": "21272328", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14223189223173763, "ground_truth": 0}, {"key": "38648957", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17441027885812901, "ground_truth": 0}, {"key": "38648957", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09670579085742638, "ground_truth": 0}, {"key": "38648957", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1015894430595158, "ground_truth": 0}, {"key": "38648957", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09877258574516659, "ground_truth": 0}, {"key": "38648957", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12378868714520307, "ground_truth": 0}, {"key": "24942981", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06903792801301785, "ground_truth": 0}, {"key": "24942981", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07004896129480252, "ground_truth": 0}, {"key": "24942981", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1470645244084135, "ground_truth": 0}, {"key": "24942981", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10447731749747748, "ground_truth": 0}, {"key": "24942981", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.28457600360182095, "ground_truth": 0}, {"key": "35882366", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1581743575058752, "ground_truth": 0}, {"key": "35882366", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16238002967928705, "ground_truth": 0}, {"key": "35882366", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.28937170518332905, "ground_truth": 0}, {"key": "35882366", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09235979736744736, "ground_truth": 0}, {"key": "35882366", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14128141758385307, "ground_truth": 0}, {"key": "40559523", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10894504379662871, "ground_truth": 0}, {"key": "40559523", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02423763471524669, "ground_truth": 0}, {"key": "40559523", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19806417160614564, "ground_truth": 0}, {"key": "40559523", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15203224502781135, "ground_truth": 0}, {"key": "40559523", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14706452897909428, "ground_truth": 0}, {"key": "24632722", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01724277713666073, "ground_truth": 0}, {"key": "24632722", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.00470006053473994, "ground_truth": 0}, {"key": "24632722", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0037800955064659983, "ground_truth": 0}, {"key": "24632722", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.007606671691490732, "ground_truth": 0}, {"key": "24632722", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0034834244235782703, "ground_truth": 0}, {"key": "36002759", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.013689477544076881, "ground_truth": 0}, {"key": "36002759", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.014957086000284425, "ground_truth": 0}, {"key": "36002759", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03649376660444638, "ground_truth": 0}, {"key": "36002759", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01020905528444049, "ground_truth": 0}, {"key": "36002759", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.022889840609021172, "ground_truth": 0}, {"key": "29508534", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02865266898752925, "ground_truth": 0}, {"key": "29508534", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.021368886469873016, "ground_truth": 0}, {"key": "29508534", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.042403826650811306, "ground_truth": 0}, {"key": "29508534", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04084571919915045, "ground_truth": 0}, {"key": "29508534", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.043691057037498815, "ground_truth": 0}, {"key": "15631612", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07290026629152699, "ground_truth": 0}, {"key": "15631612", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19930801339638882, "ground_truth": 0}, {"key": "15631612", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05665242434051137, "ground_truth": 0}, {"key": "15631612", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10158944799710776, "ground_truth": 0}, {"key": "15631612", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08359066258158021, "ground_truth": 0}, {"key": "40731892", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.873646659115587, "ground_truth": 0}, {"key": "40731892", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4054487225917193, "ground_truth": 0}, {"key": "40731892", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9795896918443547, "ground_truth": 0}, {"key": "40731892", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9618217265672983, "ground_truth": 0}, {"key": "40731892", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9523973437160757, "ground_truth": 0}, {"key": "35971910", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05602938347273926, "ground_truth": 0}, {"key": "35971910", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1037486272002752, "ground_truth": 0}, {"key": "35971910", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1907240294492644, "ground_truth": 0}, {"key": "35971910", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10818895681539248, "ground_truth": 0}, {"key": "35971910", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04468087292612935, "ground_truth": 0}, {"key": "34428424", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1901218454784686, "ground_truth": 0}, {"key": "34428424", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21076629211106457, "ground_truth": 0}, {"key": "34428424", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2877678026830136, "ground_truth": 0}, {"key": "34428424", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.633410257336712, "ground_truth": 0}, {"key": "34428424", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2774729722321701, "ground_truth": 0}, {"key": "36971005", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16559312018700803, "ground_truth": 0}, {"key": "36971005", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.25683200400864714, "ground_truth": 0}, {"key": "36971005", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1859471987020345, "ground_truth": 0}, {"key": "36971005", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17328820375761791, "ground_truth": 0}, {"key": "36971005", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09947021791148442, "ground_truth": 0}, {"key": "34649067", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2583259822053198, "ground_truth": 0}, {"key": "34649067", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6132365642608518, "ground_truth": 0}, {"key": "34649067", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6169358240792657, "ground_truth": 0}, {"key": "34649067", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23934932815784804, "ground_truth": 0}, {"key": "34649067", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.30404168453535213, "ground_truth": 0}, {"key": "37355154", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5234203546771643, "ground_truth": 0}, {"key": "37355154", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7476159589983827, "ground_truth": 0}, {"key": "37355154", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5195213191788135, "ground_truth": 0}, {"key": "37355154", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.372048785491218, "ground_truth": 0}, {"key": "37355154", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.35577487711463657, "ground_truth": 0}, {"key": "38674697", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05877655921886949, "ground_truth": 0}, {"key": "38674697", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06278920817311183, "ground_truth": 0}, {"key": "38674697", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.038466194681891844, "ground_truth": 0}, {"key": "38674697", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.048857780763130715, "ground_truth": 0}, {"key": "38674697", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05108273556492406, "ground_truth": 0}, {"key": "40525767", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6442251188837698, "ground_truth": 0}, {"key": "40525767", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8354835385629769, "ground_truth": 0}, {"key": "40525767", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6943026720791828, "ground_truth": 0}, {"key": "40525767", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786094889694, "ground_truth": 0}, {"key": "40525767", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990474435986, "ground_truth": 0}, {"key": "27165110", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6513548571387314, "ground_truth": 0}, {"key": "27165110", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6242935091087346, "ground_truth": 0}, {"key": "27165110", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7217431988480131, "ground_truth": 0}, {"key": "27165110", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527639874733, "ground_truth": 0}, {"key": "27165110", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737871721926, "ground_truth": 0}, {"key": "35497491", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0967057969579565, "ground_truth": 0}, {"key": "35497491", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04336579667135085, "ground_truth": 0}, {"key": "35497491", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.43590152547547967, "ground_truth": 0}, {"key": "35497491", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13706977705132506, "ground_truth": 0}, {"key": "35497491", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09877258952456379, "ground_truth": 0}, {"key": "40690716", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01854656445489053, "ground_truth": 0}, {"key": "40690716", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.019568676084685415, "ground_truth": 0}, {"key": "40690716", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.036220061001036245, "ground_truth": 0}, {"key": "40690716", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.068787288501681, "ground_truth": 0}, {"key": "40690716", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02271575509892874, "ground_truth": 0}, {"key": "34835193", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5907792473554854, "ground_truth": 0}, {"key": "34835193", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7490872293969227, "ground_truth": 0}, {"key": "34835193", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7556369865646264, "ground_truth": 0}, {"key": "34835193", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849511727099, "ground_truth": 0}, {"key": "34835193", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331543888126378, "ground_truth": 0}, {"key": "39471712", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.020645931057987104, "ground_truth": 0}, {"key": "39471712", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0780781601090221, "ground_truth": 0}, {"key": "39471712", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02655657307282351, "ground_truth": 0}, {"key": "39471712", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03258974290058972, "ground_truth": 0}, {"key": "39471712", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.025957357327076783, "ground_truth": 0}, {"key": "39115192", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08945459710267495, "ground_truth": 0}, {"key": "39115192", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09534946180222502, "ground_truth": 0}, {"key": "39115192", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0690379268625293, "ground_truth": 0}, {"key": "39115192", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07263670440766365, "ground_truth": 0}, {"key": "39115192", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10302442918893423, "ground_truth": 0}, {"key": "23520673", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.016529555696297302, "ground_truth": 0}, {"key": "23520673", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.005730246586204529, "ground_truth": 0}, {"key": "23520673", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01784873690218777, "ground_truth": 0}, {"key": "23520673", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0072890776188882485, "ground_truth": 0}, {"key": "23520673", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.022286186380113707, "ground_truth": 0}, {"key": "35764233", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08122775867149855, "ground_truth": 0}, {"key": "35764233", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05165378853566939, "ground_truth": 0}, {"key": "35764233", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02072506201508334, "ground_truth": 0}, {"key": "35764233", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.024053552920588278, "ground_truth": 0}, {"key": "35764233", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09334687354916989, "ground_truth": 0}, {"key": "35228910", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05261895536647485, "ground_truth": 0}, {"key": "35228910", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03488088813139881, "ground_truth": 0}, {"key": "35228910", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08151975261205369, "ground_truth": 0}, {"key": "35228910", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03258974336644341, "ground_truth": 0}, {"key": "35228910", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04385456524497915, "ground_truth": 0}, {"key": "36795599", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.053799643792269904, "ground_truth": 0}, {"key": "36795599", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.129402730262344, "ground_truth": 0}, {"key": "36795599", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07477004461646844, "ground_truth": 0}, {"key": "36795599", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1361483187467098, "ground_truth": 0}, {"key": "36795599", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05561761151476511, "ground_truth": 0}, {"key": "38641949", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07159120382908306, "ground_truth": 0}, {"key": "38641949", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08240150282256889, "ground_truth": 0}, {"key": "38641949", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09301680329649543, "ground_truth": 0}, {"key": "38641949", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0644176628426921, "ground_truth": 0}, {"key": "38641949", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.087252251023745, "ground_truth": 0}, {"key": "29968443", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02931223076946553, "ground_truth": 0}, {"key": "29968443", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0228898410336694, "ground_truth": 0}, {"key": "29968443", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12168575382532709, "ground_truth": 0}, {"key": "29968443", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04023794342347693, "ground_truth": 0}, {"key": "29968443", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.017309096360487015, "ground_truth": 0}, {"key": "21268042", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0775176590981351, "ground_truth": 0}, {"key": "21268042", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04977344440832106, "ground_truth": 0}, {"key": "21268042", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09807932451637025, "ground_truth": 0}, {"key": "21268042", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1285251406646406, "ground_truth": 0}, {"key": "21268042", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10521053123794331, "ground_truth": 0}, {"key": "26808572", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09602549229146015, "ground_truth": 0}, {"key": "26808572", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15405757067160347, "ground_truth": 0}, {"key": "26808572", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07237402018172213, "ground_truth": 0}, {"key": "26808572", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.047425873237331925, "ground_truth": 0}, {"key": "26808572", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21733751031971452, "ground_truth": 0}, {"key": "37829390", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0726367074190428, "ground_truth": 0}, {"key": "37829390", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01584536133821484, "ground_truth": 0}, {"key": "37829390", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07211219982366207, "ground_truth": 0}, {"key": "37829390", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10970577074954656, "ground_truth": 0}, {"key": "37829390", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05921025153176716, "ground_truth": 0}, {"key": "35716045", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0913821088825012, "ground_truth": 0}, {"key": "35716045", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.031499383943550396, "ground_truth": 0}, {"key": "35716045", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07159120416702078, "ground_truth": 0}, {"key": "35716045", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10017221984446915, "ground_truth": 0}, {"key": "35716045", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07558478587337655, "ground_truth": 0}, {"key": "34367070", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.017848738743746834, "ground_truth": 0}, {"key": "34367070", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.030908957752112765, "ground_truth": 0}, {"key": "34367070", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07807816890898224, "ground_truth": 0}, {"key": "34367070", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04885777375426863, "ground_truth": 0}, {"key": "34367070", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09739041111174652, "ground_truth": 0}, {"key": "35239748", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03608394071033151, "ground_truth": 0}, {"key": "35239748", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10017221974078638, "ground_truth": 0}, {"key": "35239748", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08035746611143134, "ground_truth": 0}, {"key": "35239748", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04008735968815492, "ground_truth": 0}, {"key": "35239748", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0888202958038013, "ground_truth": 0}, {"key": "40421370", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02655657288765266, "ground_truth": 0}, {"key": "40421370", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.029760094478177995, "ground_truth": 0}, {"key": "40421370", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0726367060391415, "ground_truth": 0}, {"key": "40421370", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13568954653403828, "ground_truth": 0}, {"key": "40421370", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012431650728642631, "ground_truth": 0}, {"key": "37288396", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22953521287144496, "ground_truth": 0}, {"key": "37288396", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.029423579683579563, "ground_truth": 0}, {"key": "37288396", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1242130082622357, "ground_truth": 0}, {"key": "37288396", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07696084209435067, "ground_truth": 0}, {"key": "37288396", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.033085976574898625, "ground_truth": 0}, {"key": "38903688", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0960254924835131, "ground_truth": 0}, {"key": "38903688", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15610490282098877, "ground_truth": 0}, {"key": "38903688", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09073548159996844, "ground_truth": 0}, {"key": "38903688", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.050330632192543946, "ground_truth": 0}, {"key": "38903688", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07531230993411495, "ground_truth": 0}, {"key": "28071228", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.040845718105500604, "ground_truth": 0}, {"key": "28071228", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.039638841413738246, "ground_truth": 0}, {"key": "28071228", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08601588104162122, "ground_truth": 0}, {"key": "28071228", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06705628876461499, "ground_truth": 0}, {"key": "28071228", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.056236347060443316, "ground_truth": 0}, {"key": "36855834", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06705628694229787, "ground_truth": 0}, {"key": "36855834", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3040416669714897, "ground_truth": 0}, {"key": "36855834", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2267836223482428, "ground_truth": 0}, {"key": "36855834", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757214167929042, "ground_truth": 0}, {"key": "36855834", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16451645726287226, "ground_truth": 0}, {"key": "40548717", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12984343377887417, "ground_truth": 0}, {"key": "40548717", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10521052916390819, "ground_truth": 0}, {"key": "40548717", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09877258582410152, "ground_truth": 0}, {"key": "40548717", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.039787810389576544, "ground_truth": 0}, {"key": "40548717", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02333076808464271, "ground_truth": 0}, {"key": "37051175", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11357958488425961, "ground_truth": 0}, {"key": "37051175", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07978201193293576, "ground_truth": 0}, {"key": "37051175", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07107366377701431, "ground_truth": 0}, {"key": "37051175", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06512754540601465, "ground_truth": 0}, {"key": "37051175", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.165593121790853, "ground_truth": 0}, {"key": "38882119", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.059646942713765715, "ground_truth": 0}, {"key": "38882119", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.005797400621386192, "ground_truth": 0}, {"key": "38882119", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06187598792243237, "ground_truth": 0}, {"key": "38882119", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06187599022718501, "ground_truth": 0}, {"key": "38882119", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0510827347438402, "ground_truth": 0}, {"key": "19485402", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01342825547811045, "ground_truth": 0}, {"key": "19485402", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04742587306669229, "ground_truth": 0}, {"key": "19485402", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06052938795684832, "ground_truth": 0}, {"key": "19485402", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.050517666107651495, "ground_truth": 0}, {"key": "19485402", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.043691060845294734, "ground_truth": 0}, {"key": "36060907", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.40074936690038276, "ground_truth": 0}, {"key": "36060907", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4668456165742786, "ground_truth": 0}, {"key": "36060907", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5708098988741162, "ground_truth": 0}, {"key": "36060907", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4464947011983057, "ground_truth": 0}, {"key": "36060907", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420093064296996, "ground_truth": 0}, {"key": "24037309", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5331543980958261, "ground_truth": 0}, {"key": "24037309", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.37754064082133526, "ground_truth": 0}, {"key": "24037309", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4980468428914304, "ground_truth": 0}, {"key": "24037309", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552954103388326, "ground_truth": 0}, {"key": "24037309", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.48438005660894234, "ground_truth": 0}, {"key": "35605805", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24944722846683381, "ground_truth": 0}, {"key": "35605805", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17895589959286048, "ground_truth": 0}, {"key": "35605805", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19436782842580833, "ground_truth": 0}, {"key": "35605805", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4863315339493798, "ground_truth": 0}, {"key": "35605805", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13846179424877916, "ground_truth": 0}, {"key": "17706248", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0032476764569569143, "ground_truth": 0}, {"key": "17706248", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.036493767711240216, "ground_truth": 0}, {"key": "17706248", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.005001672482756849, "ground_truth": 0}, {"key": "17706248", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.030559864365540514, "ground_truth": 0}, {"key": "17706248", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.009268013416075672, "ground_truth": 0}, {"key": "36883559", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10302442927178324, "ground_truth": 0}, {"key": "36883559", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03271312524138684, "ground_truth": 0}, {"key": "36883559", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11357958996695658, "ground_truth": 0}, {"key": "36883559", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06536577976430873, "ground_truth": 0}, {"key": "36883559", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.044348579887113895, "ground_truth": 0}, {"key": "32799471", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05223085464656714, "ground_truth": 0}, {"key": "32799471", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02737648888061311, "ground_truth": 0}, {"key": "32799471", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.033211170113137, "ground_truth": 0}, {"key": "32799471", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06441765889845079, "ground_truth": 0}, {"key": "32799471", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.026355354173070642, "ground_truth": 0}, {"key": "34797243", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0933468828234474, "ground_truth": 0}, {"key": "34797243", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12940273150670215, "ground_truth": 0}, {"key": "34797243", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15456733325258132, "ground_truth": 0}, {"key": "34797243", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782568057338238, "ground_truth": 0}, {"key": "34797243", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1655931189197276, "ground_truth": 0}, {"key": "32154876", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0253713122276807, "ground_truth": 0}, {"key": "32154876", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04672495853664636, "ground_truth": 0}, {"key": "32154876", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06804042250667965, "ground_truth": 0}, {"key": "32154876", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03308597660995251, "ground_truth": 0}, {"key": "32154876", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012336101626103558, "ground_truth": 0}, {"key": "37962274", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07316471928528448, "ground_truth": 0}, {"key": "37962274", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04922211419243503, "ground_truth": 0}, {"key": "37962274", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12085323466778876, "ground_truth": 0}, {"key": "37962274", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06536578207623682, "ground_truth": 0}, {"key": "37962274", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10743746583476935, "ground_truth": 0}, {"key": "35574030", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07807815869897775, "ground_truth": 0}, {"key": "35574030", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.040389069166180264, "ground_truth": 0}, {"key": "35574030", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11920292300437761, "ground_truth": 0}, {"key": "35574030", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07030384543130527, "ground_truth": 0}, {"key": "35574030", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01685007978968478, "ground_truth": 0}, {"key": "39105949", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13432104045784707, "ground_truth": 0}, {"key": "39105949", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.33807714808103323, "ground_truth": 0}, {"key": "39105949", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21800272169697368, "ground_truth": 0}, {"key": "39105949", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05089372292072532, "ground_truth": 0}, {"key": "39105949", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23161423342123927, "ground_truth": 0}, {"key": "41064322", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.28616926884198957, "ground_truth": 0}, {"key": "41064322", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18359362787471048, "ground_truth": 0}, {"key": "41064322", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18126321084540004, "ground_truth": 0}, {"key": "41064322", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14608724875197146, "ground_truth": 0}, {"key": "41064322", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11436852466178178, "ground_truth": 0}, {"key": "28105101", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01128807366608292, "ground_truth": 0}, {"key": "28105101", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.058345838632170965, "ground_truth": 0}, {"key": "28105101", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.018264278147485435, "ground_truth": 0}, {"key": "28105101", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05877655539527425, "ground_truth": 0}, {"key": "28105101", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09739039652638033, "ground_truth": 0}, {"key": "36036068", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.049222115872262516, "ground_truth": 0}, {"key": "36036068", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.040087356795151345, "ground_truth": 0}, {"key": "36036068", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06656918689952737, "ground_truth": 0}, {"key": "36036068", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06954174315362104, "ground_truth": 0}, {"key": "36036068", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.031143832691682413, "ground_truth": 0}, {"key": "37991460", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10158945695846634, "ground_truth": 0}, {"key": "37991460", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1112412165049066, "ground_truth": 0}, {"key": "37991460", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19072402343040493, "ground_truth": 0}, {"key": "37991460", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15817435639228056, "ground_truth": 0}, {"key": "37991460", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09073548737158554, "ground_truth": 0}, {"key": "38437830", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.059866417642697387, "ground_truth": 0}, {"key": "38437830", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06608537301355843, "ground_truth": 0}, {"key": "38437830", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21469142085185508, "ground_truth": 0}, {"key": "38437830", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15002883058341013, "ground_truth": 0}, {"key": "38437830", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10052487506266207, "ground_truth": 0}, {"key": "36507138", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.015189048960335851, "ground_truth": 0}, {"key": "36507138", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.013020489732646941, "ground_truth": 0}, {"key": "36507138", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010735162864501768, "ground_truth": 0}, {"key": "36507138", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009055264110933357, "ground_truth": 0}, {"key": "36507138", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012771867205717026, "ground_truth": 0}, {"key": "37824866", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.21667377834504362, "ground_truth": 0}, {"key": "37824866", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10123347698037435, "ground_truth": 0}, {"key": "37824866", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04552200713779611, "ground_truth": 0}, {"key": "37824866", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06210312110766562, "ground_truth": 0}, {"key": "37824866", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07107366566422321, "ground_truth": 0}, {"key": "25088134", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04707418007221424, "ground_truth": 0}, {"key": "25088134", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.047780067550966185, "ground_truth": 0}, {"key": "25088134", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14223188763527153, "ground_truth": 0}, {"key": "25088134", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.727975435610614, "ground_truth": 0}, {"key": "25088134", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14608723918525338, "ground_truth": 0}, {"key": "40172531", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.032589741942371436, "ground_truth": 0}, {"key": "40172531", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10158944969008807, "ground_truth": 0}, {"key": "40172531", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06681232860569038, "ground_truth": 0}, {"key": "40172531", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06878728294774689, "ground_truth": 0}, {"key": "40172531", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11357959429670694, "ground_truth": 0}, {"key": "37035874", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.31912138535650647, "ground_truth": 0}, {"key": "37035874", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.25534364812896404, "ground_truth": 0}, {"key": "37035874", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.40544873545583027, "ground_truth": 0}, {"key": "37035874", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.36477756898362923, "ground_truth": 0}, {"key": "37035874", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991051745675062, "ground_truth": 0}, {"key": "36404465", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.49218812459138434, "ground_truth": 0}, {"key": "36404465", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4532618481587836, "ground_truth": 0}, {"key": "36404465", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.566018535419899, "ground_truth": 0}, {"key": "36404465", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.468790623733009, "ground_truth": 0}, {"key": "36404465", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24436302603593818, "ground_truth": 0}, {"key": "39602052", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06052939058689765, "ground_truth": 0}, {"key": "39602052", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09203286363471565, "ground_truth": 0}, {"key": "39602052", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09947020699033755, "ground_truth": 0}, {"key": "39602052", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06512754919583985, "ground_truth": 0}, {"key": "39602052", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1233656161695392, "ground_truth": 0}, {"key": "33792789", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07531230869056123, "ground_truth": 0}, {"key": "33792789", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08694166090368023, "ground_truth": 0}, {"key": "33792789", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.31912138165485404, "ground_truth": 0}, {"key": "33792789", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10894504222247914, "ground_truth": 0}, {"key": "33792789", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15507847521695928, "ground_truth": 0}, {"key": "32776626", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04451442676622041, "ground_truth": 0}, {"key": "32776626", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04023794465673423, "ground_truth": 0}, {"key": "32776626", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.023870834560183383, "ground_truth": 0}, {"key": "32776626", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.040845718271861765, "ground_truth": 0}, {"key": "32776626", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.027480693118712207, "ground_truth": 0}, {"key": "37195090", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027795625297514143, "ground_truth": 0}, {"key": "37195090", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.015663648834673374, "ground_truth": 0}, {"key": "37195090", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.045692030775181726, "ground_truth": 0}, {"key": "37195090", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05127241947020622, "ground_truth": 0}, {"key": "37195090", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.033085977814546155, "ground_truth": 0}, {"key": "33981824", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.258325969198293, "ground_truth": 0}, {"key": "33981824", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4590761297560133, "ground_truth": 0}, {"key": "33981824", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.29259531880047585, "ground_truth": 0}, {"key": "33981824", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.28616925475715277, "ground_truth": 0}, {"key": "33981824", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21206881113100978, "ground_truth": 0}, {"key": "39569142", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.47073661718250226, "ground_truth": 0}, {"key": "39569142", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.39047583327065843, "ground_truth": 0}, {"key": "39569142", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7170118698544607, "ground_truth": 0}, {"key": "39569142", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.33111972708987714, "ground_truth": 0}, {"key": "39569142", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757213683967746, "ground_truth": 0}, {"key": "40268210", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1699562383975325, "ground_truth": 0}, {"key": "40268210", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0913821019108655, "ground_truth": 0}, {"key": "40268210", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10158944883608295, "ground_truth": 0}, {"key": "40268210", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610490220974343, "ground_truth": 0}, {"key": "40268210", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2337063560536994, "ground_truth": 0}, {"key": "34925159", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03448852389784626, "ground_truth": 0}, {"key": "34925159", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01542455201876003, "ground_truth": 0}, {"key": "34925159", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08093670961115727, "ground_truth": 0}, {"key": "34925159", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02585877722588339, "ground_truth": 0}, {"key": "34925159", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757213556105123, "ground_truth": 0}, {"key": "36181903", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18476750008660814, "ground_truth": 0}, {"key": "36181903", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15921740301854434, "ground_truth": 0}, {"key": "36181903", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6926419942331903, "ground_truth": 0}, {"key": "36181903", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12506538330936057, "ground_truth": 0}, {"key": "36181903", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.40168781444224894, "ground_truth": 0}, {"key": "38620559", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7170118671056823, "ground_truth": 0}, {"key": "38620559", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6584174991145336, "ground_truth": 0}, {"key": "38620559", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3522017966107917, "ground_truth": 0}, {"key": "38620559", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526751354032, "ground_truth": 0}, {"key": "38620559", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300520055678, "ground_truth": 0}, {"key": "32719657", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.018689307184691386, "ground_truth": 0}, {"key": "32719657", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.053998842747479986, "ground_truth": 0}, {"key": "32719657", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07613247788653722, "ground_truth": 0}, {"key": "32719657", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04689925867956164, "ground_truth": 0}, {"key": "32719657", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02002343924958696, "ground_truth": 0}, {"key": "37530914", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08632348126115558, "ground_truth": 0}, {"key": "37530914", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.31237001081302657, "ground_truth": 0}, {"key": "37530914", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14511536334240804, "ground_truth": 0}, {"key": "37530914", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610489123237425, "ground_truth": 0}, {"key": "37530914", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24653334328980553, "ground_truth": 0}, {"key": "33306933", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09501304797406009, "ground_truth": 0}, {"key": "33306933", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15102780419646525, "ground_truth": 0}, {"key": "33306933", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.31405055142357974, "ground_truth": 0}, {"key": "33306933", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798744551680166, "ground_truth": 0}, {"key": "33306933", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10743746748630072, "ground_truth": 0}, {"key": "33837212", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08694166391066598, "ground_truth": 0}, {"key": "33837212", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12592276835610192, "ground_truth": 0}, {"key": "33837212", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0408457170638145, "ground_truth": 0}, {"key": "33837212", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11838509096159595, "ground_truth": 0}, {"key": "33837212", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09602549073673794, "ground_truth": 0}, {"key": "40945179", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1347759177904543, "ground_truth": 0}, {"key": "40945179", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1159607126793292, "ground_truth": 0}, {"key": "40945179", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14128142526781193, "ground_truth": 0}, {"key": "40945179", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06705628678672676, "ground_truth": 0}, {"key": "40945179", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11920292327424316, "ground_truth": 0}, {"key": "34152358", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04922211418972139, "ground_truth": 0}, {"key": "34152358", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09602549537659778, "ground_truth": 0}, {"key": "34152358", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07211219712997964, "ground_truth": 0}, {"key": "34152358", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03704716778680754, "ground_truth": 0}, {"key": "34152358", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.057493279072579555, "ground_truth": 0}, {"key": "34136541", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20689406284867842, "ground_truth": 0}, {"key": "34136541", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.43014734439652585, "ground_truth": 0}, {"key": "34136541", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3345894446779789, "ground_truth": 0}, {"key": "34136541", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.39981166310861793, "ground_truth": 0}, {"key": "34136541", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23792990217078333, "ground_truth": 0}, {"key": "37469603", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01994693598370233, "ground_truth": 0}, {"key": "37469603", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03846619346763492, "ground_truth": 0}, {"key": "37469603", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.016785491335542024, "ground_truth": 0}, {"key": "37469603", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03258974350550599, "ground_truth": 0}, {"key": "37469603", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03789242687134808, "ground_truth": 0}, {"key": "37353611", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0465512745882227, "ground_truth": 0}, {"key": "37353611", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.00952248622903087, "ground_truth": 0}, {"key": "37353611", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02112519372484505, "ground_truth": 0}, {"key": "37353611", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.011597361134992544, "ground_truth": 0}, {"key": "37353611", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01621503041231495, "ground_truth": 0}, {"key": "37211649", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05582313992538738, "ground_truth": 0}, {"key": "37211649", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07211220093960653, "ground_truth": 0}, {"key": "37211649", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06853749435661778, "ground_truth": 0}, {"key": "37211649", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.041152886436964575, "ground_truth": 0}, {"key": "37211649", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08882029253618705, "ground_truth": 0}, {"key": "37320976", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02136888568649926, "ground_truth": 0}, {"key": "37320976", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02489280248392935, "ground_truth": 0}, {"key": "37320976", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.059428216932045815, "ground_truth": 0}, {"key": "37320976", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.027272668433421254, "ground_truth": 0}, {"key": "37320976", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06754669043022342, "ground_truth": 0}, {"key": "34492412", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6206216089816879, "ground_truth": 0}, {"key": "34492412", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5698526467729167, "ground_truth": 0}, {"key": "34492412", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8272706867057966, "ground_truth": 0}, {"key": "34492412", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6984323141681563, "ground_truth": 0}, {"key": "34492412", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4843800748155019, "ground_truth": 0}, {"key": "36655016", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2254166087681905, "ground_truth": 0}, {"key": "36655016", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08663206894364557, "ground_truth": 0}, {"key": "36655016", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2281564994279912, "ground_truth": 0}, {"key": "36655016", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11676401646760215, "ground_truth": 0}, {"key": "36655016", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16344542874131626, "ground_truth": 0}, {"key": "35220773", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.21206880828960462, "ground_truth": 0}, {"key": "35220773", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1613202373594503, "ground_truth": 0}, {"key": "35220773", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4339814729664101, "ground_truth": 0}, {"key": "35220773", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3433417514740141, "ground_truth": 0}, {"key": "35220773", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.259075103396444, "ground_truth": 0}, {"key": "31569808", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3328523272022133, "ground_truth": 0}, {"key": "31569808", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11676401344538881, "ground_truth": 0}, {"key": "31569808", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23934934218419507, "ground_truth": 0}, {"key": "31569808", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12852513942190263, "ground_truth": 0}, {"key": "31569808", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2735743946406735, "ground_truth": 0}, {"key": "37696256", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04146227415251396, "ground_truth": 0}, {"key": "37696256", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10818895460057362, "ground_truth": 0}, {"key": "37696256", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06804042312001714, "ground_truth": 0}, {"key": "37696256", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15203224358909476, "ground_truth": 0}, {"key": "37696256", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04451443182249617, "ground_truth": 0}, {"key": "36874328", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.039638837748644136, "ground_truth": 0}, {"key": "36874328", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0235992963309288, "ground_truth": 0}, {"key": "36874328", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06233103769867724, "ground_truth": 0}, {"key": "36874328", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.030675797725634096, "ground_truth": 0}, {"key": "36874328", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.041930526674500174, "ground_truth": 0}, {"key": "24532377", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4590761393463847, "ground_truth": 0}, {"key": "24532377", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3415824842943782, "ground_truth": 0}, {"key": "24532377", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25608710585172584, "ground_truth": 0}, {"key": "24532377", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995779457426, "ground_truth": 0}, {"key": "24532377", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167448438624, "ground_truth": 0}, {"key": "39560618", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10594827862632185, "ground_truth": 0}, {"key": "39560618", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13386748956608902, "ground_truth": 0}, {"key": "39560618", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1634454385011994, "ground_truth": 0}, {"key": "39560618", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0639484165455652, "ground_truth": 0}, {"key": "39560618", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08389038787803046, "ground_truth": 0}, {"key": "34922693", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03567855321538467, "ground_truth": 0}, {"key": "34922693", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02333076781189101, "ground_truth": 0}, {"key": "34922693", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.046378207198692414, "ground_truth": 0}, {"key": "34922693", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.038178273773166196, "ground_truth": 0}, {"key": "34922693", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10669059629837137, "ground_truth": 0}, {"key": "33629577", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24580845958468212, "ground_truth": 0}, {"key": "33629577", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2583259672509832, "ground_truth": 0}, {"key": "33629577", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20181322163368381, "ground_truth": 0}, {"key": "33629577", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405545914881145, "ground_truth": 0}, {"key": "33629577", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420095089675206, "ground_truth": 0}, {"key": "32284359", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.044018651114094545, "ground_truth": 0}, {"key": "32284359", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04885778093616601, "ground_truth": 0}, {"key": "32284359", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11516222857128508, "ground_truth": 0}, {"key": "32284359", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0980793220633906, "ground_truth": 0}, {"key": "32284359", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08819004613836384, "ground_truth": 0}, {"key": "28082962", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24220562173613364, "ground_truth": 0}, {"key": "28082962", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1285251280372186, "ground_truth": 0}, {"key": "28082962", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.33111973777720655, "ground_truth": 0}, {"key": "28082962", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594720262470552, "ground_truth": 0}, {"key": "28082962", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1451153676235354, "ground_truth": 0}, {"key": "24796803", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5736784117942765, "ground_truth": 0}, {"key": "24796803", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.48828338014241685, "ground_truth": 0}, {"key": "24796803", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3960681640215379, "ground_truth": 0}, {"key": "24796803", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974735720240216, "ground_truth": 0}, {"key": "24796803", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.361164719826061, "ground_truth": 0}, {"key": "35466150", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08181271340191422, "ground_truth": 0}, {"key": "35466150", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08663206858425081, "ground_truth": 0}, {"key": "35466150", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17328819888414393, "ground_truth": 0}, {"key": "35466150", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08093670991443784, "ground_truth": 0}, {"key": "35466150", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17106118079647822, "ground_truth": 0}, {"key": "35754289", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1112412113594729, "ground_truth": 0}, {"key": "35754289", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15405756459880907, "ground_truth": 0}, {"key": "35754289", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20689406823796064, "ground_truth": 0}, {"key": "35754289", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11357958852363223, "ground_truth": 0}, {"key": "35754289", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06705628522228259, "ground_truth": 0}, {"key": "36678662", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1500288206769398, "ground_truth": 0}, {"key": "36678662", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06878727956245759, "ground_truth": 0}, {"key": "36678662", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09739040527023778, "ground_truth": 0}, {"key": "36678662", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0832919288923553, "ground_truth": 0}, {"key": "36678662", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08977329164609738, "ground_truth": 0}, {"key": "35399671", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15610489336541888, "ground_truth": 0}, {"key": "35399671", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2782567945772236, "ground_truth": 0}, {"key": "35399671", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5039061631458177, "ground_truth": 0}, {"key": "35399671", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.31742626856260536, "ground_truth": 0}, {"key": "35399671", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11436852441525698, "ground_truth": 0}, {"key": "36888180", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14706453045104328, "ground_truth": 0}, {"key": "36888180", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1688569480121581, "ground_truth": 0}, {"key": "36888180", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13846179124198926, "ground_truth": 0}, {"key": "36888180", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2107663001991125, "ground_truth": 0}, {"key": "36888180", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1766716079304066, "ground_truth": 0}, {"key": "28061069", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16451645581467178, "ground_truth": 0}, {"key": "28061069", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04518375573370491, "ground_truth": 0}, {"key": "28061069", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14608724746733992, "ground_truth": 0}, {"key": "28061069", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07185126875901182, "ground_truth": 0}, {"key": "28061069", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19436782376704334, "ground_truth": 0}, {"key": "22259982", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12852513486488792, "ground_truth": 0}, {"key": "22259982", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4455295409451236, "ground_truth": 0}, {"key": "22259982", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.36840571263301314, "ground_truth": 0}, {"key": "22259982", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2133771743535294, "ground_truth": 0}, {"key": "22259982", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953520668837588, "ground_truth": 0}, {"key": "34026805", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19072401857337526, "ground_truth": 0}, {"key": "34026805", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4016878028977875, "ground_truth": 0}, {"key": "34026805", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3259495262141606, "ground_truth": 0}, {"key": "34026805", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17553806881223405, "ground_truth": 0}, {"key": "34026805", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05300977213949611, "ground_truth": 0}, {"key": "36713809", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13206615371451907, "ground_truth": 0}, {"key": "36713809", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.209469693557182, "ground_truth": 0}, {"key": "36713809", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23651623526143356, "ground_truth": 0}, {"key": "36713809", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.31237001925910735, "ground_truth": 0}, {"key": "36713809", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594952203293787, "ground_truth": 0}, {"key": "39726411", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07751765765216254, "ground_truth": 0}, {"key": "39726411", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06187598803367632, "ground_truth": 0}, {"key": "39726411", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10781264859742588, "ground_truth": 0}, {"key": "39726411", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09982065779266376, "ground_truth": 0}, {"key": "39726411", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07779744878183083, "ground_truth": 0}, {"key": "37069841", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.028220987930677406, "ground_truth": 0}, {"key": "37069841", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.012576348705933093, "ground_truth": 0}, {"key": "37069841", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03258974219907914, "ground_truth": 0}, {"key": "37069841", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.030908962413270125, "ground_truth": 0}, {"key": "37069841", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03488088691703492, "ground_truth": 0}, {"key": "38894693", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03904829026438719, "ground_truth": 0}, {"key": "38894693", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.028652669235995007, "ground_truth": 0}, {"key": "38894693", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01646617436137999, "ground_truth": 0}, {"key": "38894693", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.045862666081949985, "ground_truth": 0}, {"key": "38894693", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.017509556123928006, "ground_truth": 0}, {"key": "33946032", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20689404865051772, "ground_truth": 0}, {"key": "33946032", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18832398725828275, "ground_truth": 0}, {"key": "33946032", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2704802177351344, "ground_truth": 0}, {"key": "33946032", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21337716967612988, "ground_truth": 0}, {"key": "33946032", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07921031717236438, "ground_truth": 0}, {"key": "39035311", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.48828341453496527, "ground_truth": 0}, {"key": "39035311", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5214711611918602, "ground_truth": 0}, {"key": "39035311", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5602526610238868, "ground_truth": 0}, {"key": "39035311", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358254960059, "ground_truth": 0}, {"key": "39035311", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397045463724, "ground_truth": 0}, {"key": "27680038", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03308597821711553, "ground_truth": 0}, {"key": "27680038", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08570928054885874, "ground_truth": 0}, {"key": "27680038", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02605630568192316, "ground_truth": 0}, {"key": "27680038", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08819003594427124, "ground_truth": 0}, {"key": "27680038", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02727266966773406, "ground_truth": 0}, {"key": "36901907", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19806417346284141, "ground_truth": 0}, {"key": "36901907", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1778108785543967, "ground_truth": 0}, {"key": "36901907", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2107662910032826, "ground_truth": 0}, {"key": "36901907", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2200070942033166, "ground_truth": 0}, {"key": "36901907", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08151975404148529, "ground_truth": 0}, {"key": "21530542", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11397345828032027, "ground_truth": 0}, {"key": "21530542", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11961366285762635, "ground_truth": 0}, {"key": "21530542", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01518904956810043, "ground_truth": 0}, {"key": "21530542", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0783598097395174, "ground_truth": 0}, {"key": "21530542", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08035746575004568, "ground_truth": 0}, {"key": "38192532", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5117166003447025, "ground_truth": 0}, {"key": "38192532", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5698526585720501, "ground_truth": 0}, {"key": "38192532", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5869964286421578, "ground_truth": 0}, {"key": "38192532", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760161049676, "ground_truth": 0}, {"key": "38192532", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.47268346651397664, "ground_truth": 0}, {"key": "34102400", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01040831456765282, "ground_truth": 0}, {"key": "34102400", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0035380863662876232, "ground_truth": 0}, {"key": "34102400", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.008030813465112705, "ground_truth": 0}, {"key": "34102400", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.020488553730542775, "ground_truth": 0}, {"key": "34102400", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.006192990146183743, "ground_truth": 0}, {"key": "36133399", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.019050898518184978, "ground_truth": 0}, {"key": "36133399", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.028761588138206902, "ground_truth": 0}, {"key": "36133399", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02987309186123301, "ground_truth": 0}, {"key": "36133399", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.042087727685262186, "ground_truth": 0}, {"key": "36133399", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.032589740579744515, "ground_truth": 0}, {"key": "34314544", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0967057915904975, "ground_truth": 0}, {"key": "34314544", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04161779539599759, "ground_truth": 0}, {"key": "34314544", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1384617860441649, "ground_truth": 0}, {"key": "34314544", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.033971998471090344, "ground_truth": 0}, {"key": "34314544", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.048136767716665065, "ground_truth": 0}, {"key": "33460074", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02615561894198887, "ground_truth": 0}, {"key": "33460074", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.028220987794971564, "ground_truth": 0}, {"key": "33460074", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.020488553701633164, "ground_truth": 0}, {"key": "33460074", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03296124360018443, "ground_truth": 0}, {"key": "33460074", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.016340128669975994, "ground_truth": 0}, {"key": "36191495", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.057918087707728536, "ground_truth": 0}, {"key": "36191495", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10818895963764995, "ground_truth": 0}, {"key": "36191495", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07211219962356233, "ground_truth": 0}, {"key": "36191495", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08756384081825987, "ground_truth": 0}, {"key": "36191495", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16885695442182178, "ground_truth": 0}, {"key": "39532668", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09947021208437354, "ground_truth": 0}, {"key": "39532668", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.009449081257660044, "ground_truth": 0}, {"key": "39532668", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02737648915582166, "ground_truth": 0}, {"key": "39532668", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.015603532295782792, "ground_truth": 0}, {"key": "39532668", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07751765856824387, "ground_truth": 0}, {"key": "20328247", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04401865582257771, "ground_truth": 0}, {"key": "20328247", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.005281333890118944, "ground_truth": 0}, {"key": "20328247", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.034749625983293855, "ground_truth": 0}, {"key": "20328247", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.034618840234239556, "ground_truth": 0}, {"key": "20328247", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04336580244256627, "ground_truth": 0}, {"key": "39112675", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.031618767674239455, "ground_truth": 0}, {"key": "39112675", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0344885242734864, "ground_truth": 0}, {"key": "39112675", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.015845361373651088, "ground_truth": 0}, {"key": "39112675", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04760265819879954, "ground_truth": 0}, {"key": "39112675", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.008156249125049706, "ground_truth": 0}, {"key": "31620300", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.004416556063430073, "ground_truth": 0}, {"key": "31620300", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.024423091708009156, "ground_truth": 0}, {"key": "31620300", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06097518506095877, "ground_truth": 0}, {"key": "31620300", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0369080673085489, "ground_truth": 0}, {"key": "31620300", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05791808962768347, "ground_truth": 0}, {"key": "37518509", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3106944054411704, "ground_truth": 0}, {"key": "37518509", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22135068763934163, "ground_truth": 0}, {"key": "37518509", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.37937841450016624, "ground_truth": 0}, {"key": "37518509", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4455295257036469, "ground_truth": 0}, {"key": "37518509", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2829881330330038, "ground_truth": 0}, {"key": "35454095", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.030792165366838452, "ground_truth": 0}, {"key": "35454095", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.020725062943325778, "ground_truth": 0}, {"key": "35454095", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04535257977136312, "ground_truth": 0}, {"key": "35454095", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.022889841051358707, "ground_truth": 0}, {"key": "35454095", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.040845715816222455, "ground_truth": 0}, {"key": "38542788", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07030384498238541, "ground_truth": 0}, {"key": "38542788", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.053009773516191586, "ground_truth": 0}, {"key": "38542788", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16132024269510623, "ground_truth": 0}, {"key": "38542788", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07613248183139058, "ground_truth": 0}, {"key": "38542788", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06210312178739078, "ground_truth": 0}, {"key": "23944937", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.028761589171935394, "ground_truth": 0}, {"key": "23944937", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06233103582753811, "ground_truth": 0}, {"key": "23944937", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10818895186449189, "ground_truth": 0}, {"key": "23944937", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03567855411344313, "ground_truth": 0}, {"key": "23944937", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05261895430972074, "ground_truth": 0}, {"key": "31753944", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.004736748704372592, "ground_truth": 0}, {"key": "31753944", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0018895387173419578, "ground_truth": 0}, {"key": "31753944", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.004451041453375905, "ground_truth": 0}, {"key": "31753944", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.005405899773723353, "ground_truth": 0}, {"key": "31753944", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.004829721865798866, "ground_truth": 0}, {"key": "35527214", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04742587381008297, "ground_truth": 0}, {"key": "35527214", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.037608633855046064, "ground_truth": 0}, {"key": "35527214", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.062789205714541, "ground_truth": 0}, {"key": "35527214", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10302443074511611, "ground_truth": 0}, {"key": "35527214", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06418264336753621, "ground_truth": 0}, {"key": "40400404", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.26435837383965444, "ground_truth": 0}, {"key": "40400404", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03234432918654127, "ground_truth": 0}, {"key": "40400404", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09401018553460218, "ground_truth": 0}, {"key": "40400404", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06394842193947844, "ground_truth": 0}, {"key": "40400404", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0474258734568652, "ground_truth": 0}, {"key": "21713119", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10932482482004859, "ground_truth": 0}, {"key": "21713119", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15559099282595085, "ground_truth": 0}, {"key": "21713119", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09367800365971819, "ground_truth": 0}, {"key": "21713119", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13986564909358448, "ground_truth": 0}, {"key": "21713119", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16505408866898988, "ground_truth": 0}, {"key": "28730678", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07477004929081123, "ground_truth": 0}, {"key": "28730678", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06536578243269489, "ground_truth": 0}, {"key": "28730678", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1289632932972604, "ground_truth": 0}, {"key": "28730678", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10158944914505405, "ground_truth": 0}, {"key": "28730678", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09982066323066598, "ground_truth": 0}, {"key": "36823733", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19436781495204822, "ground_truth": 0}, {"key": "36823733", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.25832597722491396, "ground_truth": 0}, {"key": "36823733", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.254601612981077, "ground_truth": 0}, {"key": "36823733", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11124121815125726, "ground_truth": 0}, {"key": "36823733", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.258325977748688, "ground_truth": 0}, {"key": "35988862", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02716923221789503, "ground_truth": 0}, {"key": "35988862", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06097517989989195, "ground_truth": 0}, {"key": "35988862", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.035012627471592436, "ground_truth": 0}, {"key": "35988862", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.041307304007258995, "ground_truth": 0}, {"key": "35988862", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.010944577391723654, "ground_truth": 0}, {"key": "40499665", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10781263804110272, "ground_truth": 0}, {"key": "40499665", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06008664823221176, "ground_truth": 0}, {"key": "40499665", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13072869240965257, "ground_truth": 0}, {"key": "40499665", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1167640146154258, "ground_truth": 0}, {"key": "40499665", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1250653882014518, "ground_truth": 0}, {"key": "32829820", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.010611421375134517, "ground_truth": 0}, {"key": "32829820", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.028436033036236853, "ground_truth": 0}, {"key": "32829820", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.013848611027617502, "ground_truth": 0}, {"key": "32829820", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.038035096991085704, "ground_truth": 0}, {"key": "32829820", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.013070785103022063, "ground_truth": 0}, {"key": "20583553", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6085940241106349, "ground_truth": 0}, {"key": "20583553", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.700894796838684, "ground_truth": 0}, {"key": "20583553", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5097643680448206, "ground_truth": 0}, {"key": "20583553", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468889472804, "ground_truth": 0}, {"key": "20583553", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4717099528109396, "ground_truth": 0}, {"key": "30501550", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5525396993806037, "ground_truth": 0}, {"key": "30501550", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5331543907927202, "ground_truth": 0}, {"key": "30501550", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8104789028834625, "ground_truth": 0}, {"key": "30501550", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357482118115, "ground_truth": 0}, {"key": "30501550", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.781330636116725, "ground_truth": 0}, {"key": "38755897", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22678362969322516, "ground_truth": 0}, {"key": "38755897", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.143667613332925, "ground_truth": 0}, {"key": "38755897", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25757828261180626, "ground_truth": 0}, {"key": "38755897", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2814056184858988, "ground_truth": 0}, {"key": "38755897", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23022675524917424, "ground_truth": 0}, {"key": "35507201", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.026556572350305344, "ground_truth": 0}, {"key": "35507201", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17553806081109527, "ground_truth": 0}, {"key": "35507201", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06008664669483469, "ground_truth": 0}, {"key": "35507201", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.014899643997041722, "ground_truth": 0}, {"key": "35507201", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01994693417951183, "ground_truth": 0}, {"key": "36453511", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.031143831759067587, "ground_truth": 0}, {"key": "36453511", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04958902531128195, "ground_truth": 0}, {"key": "36453511", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08419107664738812, "ground_truth": 0}, {"key": "36453511", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06608537157935279, "ground_truth": 0}, {"key": "36453511", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1755380657912996, "ground_truth": 0}, {"key": "38066835", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0803574686707543, "ground_truth": 0}, {"key": "38066835", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17895590495874086, "ground_truth": 0}, {"key": "38066835", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14414885705908664, "ground_truth": 0}, {"key": "38066835", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19682620838537793, "ground_truth": 0}, {"key": "38066835", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0680404240731241, "ground_truth": 0}, {"key": "39697181", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02537131286318873, "ground_truth": 0}, {"key": "39697181", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01927113711387321, "ground_truth": 0}, {"key": "39697181", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.020645930988669698, "ground_truth": 0}, {"key": "39697181", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04434857941179649, "ground_truth": 0}, {"key": "39697181", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.009559399490008199, "ground_truth": 0}, {"key": "21820893", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06348235896160277, "ground_truth": 0}, {"key": "21820893", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03173859077091986, "ground_truth": 0}, {"key": "21820893", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.027480693222503155, "ground_truth": 0}, {"key": "21820893", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.031026180859201682, "ground_truth": 0}, {"key": "21820893", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05184546504866641, "ground_truth": 0}, {"key": "40519933", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0075187182184926656, "ground_truth": 0}, {"key": "40519933", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.007636216089804106, "ground_truth": 0}, {"key": "40519933", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02498779535035219, "ground_truth": 0}, {"key": "40519933", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.013902059567787934, "ground_truth": 0}, {"key": "40519933", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.021287351062565983, "ground_truth": 0}, {"key": "30446033", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18952109299781747, "ground_truth": 0}, {"key": "30446033", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2720245572291436, "ground_truth": 0}, {"key": "30446033", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19682621032991277, "ground_truth": 0}, {"key": "30446033", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.33807714178411385, "ground_truth": 0}, {"key": "30446033", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22541661872288632, "ground_truth": 0}, {"key": "40216291", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12940272967498342, "ground_truth": 0}, {"key": "40216291", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11676400896974698, "ground_truth": 0}, {"key": "40216291", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06512754780249815, "ground_truth": 0}, {"key": "40216291", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16132024182785537, "ground_truth": 0}, {"key": "40216291", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06233104083514443, "ground_truth": 0}, {"key": "33479118", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11436853254025516, "ground_truth": 0}, {"key": "33479118", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3522017786471311, "ground_truth": 0}, {"key": "33479118", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21601153681297064, "ground_truth": 0}, {"key": "33479118", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2942149629491729, "ground_truth": 0}, {"key": "33479118", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.26284185876303395, "ground_truth": 0}, {"key": "22297373", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09401017772408288, "ground_truth": 0}, {"key": "22297373", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.46295863079844063, "ground_truth": 0}, {"key": "22297373", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.169956238397152, "ground_truth": 0}, {"key": "22297373", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245688751516, "ground_truth": 0}, {"key": "22297373", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09334687905714191, "ground_truth": 0}, {"key": "36463668", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.48047866319070354, "ground_truth": 0}, {"key": "36463668", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.32594952585953324, "ground_truth": 0}, {"key": "36463668", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6601723741603075, "ground_truth": 0}, {"key": "36463668", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.43206339993017123, "ground_truth": 0}, {"key": "36463668", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758390867588, "ground_truth": 0}, {"key": "35264615", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03044434883098979, "ground_truth": 0}, {"key": "35264615", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05261895373284681, "ground_truth": 0}, {"key": "35264615", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06853748888433235, "ground_truth": 0}, {"key": "35264615", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08913692613908139, "ground_truth": 0}, {"key": "35264615", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13568953557518837, "ground_truth": 0}, {"key": "39898482", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15974101903563453, "ground_truth": 0}, {"key": "39898482", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13296424731471126, "ground_truth": 0}, {"key": "39898482", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17497346012413223, "ground_truth": 0}, {"key": "39898482", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18010667425182134, "ground_truth": 0}, {"key": "39898482", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18476752012151157, "ground_truth": 0}, {"key": "37228721", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0488577822169942, "ground_truth": 0}, {"key": "37228721", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08913693175804224, "ground_truth": 0}, {"key": "37228721", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03308597794865301, "ground_truth": 0}, {"key": "37228721", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.016529557841583473, "ground_truth": 0}, {"key": "37228721", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03197956167723589, "ground_truth": 0}, {"key": "24535799", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.932943713000743, "ground_truth": 0}, {"key": "24535799", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8459424440756383, "ground_truth": 0}, {"key": "24535799", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7371581653646159, "ground_truth": 0}, {"key": "24535799", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9082930339928703, "ground_truth": 0}, {"key": "24535799", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096153851159, "ground_truth": 0}, {"key": "35177759", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.019794780723657653, "ground_truth": 0}, {"key": "35177759", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02508314018812143, "ground_truth": 0}, {"key": "35177759", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.026861202457851747, "ground_truth": 0}, {"key": "35177759", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0249877957033054, "ground_truth": 0}, {"key": "35177759", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0352775485582397, "ground_truth": 0}, {"key": "34364829", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03622005958514776, "ground_truth": 0}, {"key": "34364829", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.020884216044297944, "ground_truth": 0}, {"key": "34364829", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.027376489504723257, "ground_truth": 0}, {"key": "34364829", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.059646937661226314, "ground_truth": 0}, {"key": "34364829", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.016657039877495998, "ground_truth": 0}, {"key": "38090732", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06465348711256888, "ground_truth": 0}, {"key": "38090732", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09009299055827784, "ground_truth": 0}, {"key": "38090732", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06164962036544219, "ground_truth": 0}, {"key": "38090732", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08151974911245381, "ground_truth": 0}, {"key": "38090732", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22405546621984998, "ground_truth": 0}, {"key": "30651479", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04586266622360457, "ground_truth": 0}, {"key": "30651479", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04161779636684367, "ground_truth": 0}, {"key": "30651479", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04304284780981981, "ground_truth": 0}, {"key": "30651479", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0396388390961774, "ground_truth": 0}, {"key": "30651479", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.042562730152576875, "ground_truth": 0}, {"key": "39380921", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11124121668895584, "ground_truth": 0}, {"key": "39380921", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10818895892019546, "ground_truth": 0}, {"key": "39380921", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09301679906108874, "ground_truth": 0}, {"key": "39380921", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14903529749698904, "ground_truth": 0}, {"key": "39380921", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0532062060850962, "ground_truth": 0}, {"key": "39037490", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.049958526155532486, "ground_truth": 0}, {"key": "39037490", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04831606745366845, "ground_truth": 0}, {"key": "39037490", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02451633686649949, "ground_truth": 0}, {"key": "39037490", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06371499653698351, "ground_truth": 0}, {"key": "39037490", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03993731642956483, "ground_truth": 0}, {"key": "35917499", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06754669772839167, "ground_truth": 0}, {"key": "35917499", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20118472942116603, "ground_truth": 0}, {"key": "35917499", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15304215163793478, "ground_truth": 0}, {"key": "35917499", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1108555954521841, "ground_truth": 0}, {"key": "35917499", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1744102776297251, "ground_truth": 0}, {"key": "34908073", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014842417662060526, "ground_truth": 0}, {"key": "34908073", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01554364701436427, "ground_truth": 0}, {"key": "34908073", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.013742321543894168, "ground_truth": 0}, {"key": "34908073", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.026861202844248536, "ground_truth": 0}, {"key": "34908073", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05500528198156857, "ground_truth": 0}, {"key": "36344759", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4882833980478699, "ground_truth": 0}, {"key": "36344759", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8019358231426807, "ground_truth": 0}, {"key": "36344759", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7201714962932358, "ground_truth": 0}, {"key": "36344759", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.592666599960869, "ground_truth": 0}, {"key": "36344759", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9069831953478246, "ground_truth": 0}, {"key": "39984637", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09401018743579091, "ground_truth": 0}, {"key": "39984637", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03010033426413694, "ground_truth": 0}, {"key": "39984637", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01927113650435229, "ground_truth": 0}, {"key": "39984637", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03461883984865745, "ground_truth": 0}, {"key": "39984637", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.023870836332290965, "ground_truth": 0}, {"key": "17917326", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15662018657243157, "ground_truth": 0}, {"key": "17917326", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.26435836140189084, "ground_truth": 0}, {"key": "17917326", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5525396891277011, "ground_truth": 0}, {"key": "17917326", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.28616926040610435, "ground_truth": 0}, {"key": "17917326", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1655931122503562, "ground_truth": 0}, {"key": "32193638", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.039490403722402104, "ground_truth": 0}, {"key": "32193638", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03161876747380108, "ground_truth": 0}, {"key": "32193638", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03346293188610056, "ground_truth": 0}, {"key": "32193638", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03185885520380725, "ground_truth": 0}, {"key": "32193638", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.027066175549548703, "ground_truth": 0}, {"key": "34564692", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19930799332309787, "ground_truth": 0}, {"key": "34564692", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08210662759491853, "ground_truth": 0}, {"key": "34564692", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2030746397034253, "ground_truth": 0}, {"key": "34564692", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1097057755361235, "ground_truth": 0}, {"key": "34564692", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944723281602402, "ground_truth": 0}, {"key": "39329284", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08977328674298844, "ground_truth": 0}, {"key": "39329284", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2720245476304697, "ground_truth": 0}, {"key": "39329284", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.054802595414366016, "ground_truth": 0}, {"key": "39329284", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.049039619834914755, "ground_truth": 0}, {"key": "39329284", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11124121292429844, "ground_truth": 0}, {"key": "37438541", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05184546731615713, "ground_truth": 0}, {"key": "37438541", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.014117893492383713, "ground_truth": 0}, {"key": "37438541", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02832831260523262, "ground_truth": 0}, {"key": "37438541", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.014842418058162759, "ground_truth": 0}, {"key": "37438541", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.010570488344499768, "ground_truth": 0}, {"key": "34652757", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06418264451173307, "ground_truth": 0}, {"key": "34652757", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.017509555217795094, "ground_truth": 0}, {"key": "34652757", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03044434790638043, "ground_truth": 0}, {"key": "34652757", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06465348592953633, "ground_truth": 0}, {"key": "34652757", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0467249564537376, "ground_truth": 0}, {"key": "31361004", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20307463315686092, "ground_truth": 0}, {"key": "31361004", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2094696912813898, "ground_truth": 0}, {"key": "31361004", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2494472195595884, "ground_truth": 0}, {"key": "31361004", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168780792249853, "ground_truth": 0}, {"key": "31361004", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23651622882798498, "ground_truth": 0}, {"key": "26150727", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02245705433831702, "ground_truth": 0}, {"key": "26150727", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09947021108894019, "ground_truth": 0}, {"key": "26150727", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05964694233953377, "ground_truth": 0}, {"key": "26150727", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05379964311987689, "ground_truth": 0}, {"key": "26150727", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10818895776517874, "ground_truth": 0}, {"key": "36997402", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.162380028401636, "ground_truth": 0}, {"key": "36997402", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03875619388498212, "ground_truth": 0}, {"key": "36997402", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.037186775571911794, "ground_truth": 0}, {"key": "36997402", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08181271062491864, "ground_truth": 0}, {"key": "36997402", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13568954592516175, "ground_truth": 0}, {"key": "37430643", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03161876502526486, "ground_truth": 0}, {"key": "37430643", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02033235373101279, "ground_truth": 0}, {"key": "37430643", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02800752013765392, "ground_truth": 0}, {"key": "37430643", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02228618564691106, "ground_truth": 0}, {"key": "37430643", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.047425872359255355, "ground_truth": 0}, {"key": "36964631", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06348235945349284, "ground_truth": 0}, {"key": "36964631", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07030384639378895, "ground_truth": 0}, {"key": "36964631", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03963884133460089, "ground_truth": 0}, {"key": "36964631", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05686154915840732, "ground_truth": 0}, {"key": "36964631", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.053998836228568506, "ground_truth": 0}, {"key": "35502013", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.020804490339570304, "ground_truth": 0}, {"key": "35502013", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026255302279347106, "ground_truth": 0}, {"key": "35502013", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01868930784618969, "ground_truth": 0}, {"key": "35502013", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.018404890362010946, "ground_truth": 0}, {"key": "35502013", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024145421880309735, "ground_truth": 0}, {"key": "33987664", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01596765486422076, "ground_truth": 0}, {"key": "33987664", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.005957154362851826, "ground_truth": 0}, {"key": "33987664", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.024987794327798397, "ground_truth": 0}, {"key": "33987664", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02072506195130649, "ground_truth": 0}, {"key": "33987664", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01897803619484743, "ground_truth": 0}, {"key": "35203721", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.00757724111500714, "ground_truth": 0}, {"key": "35203721", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.004348380919803466, "ground_truth": 0}, {"key": "35203721", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.004905405823902287, "ground_truth": 0}, {"key": "35203721", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.033844032871582067, "ground_truth": 0}, {"key": "35203721", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03488088848429823, "ground_truth": 0}, {"key": "39028348", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.008219692976205843, "ground_truth": 0}, {"key": "39028348", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04620575045491521, "ground_truth": 0}, {"key": "39028348", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.026963500351262378, "ground_truth": 0}, {"key": "39028348", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.013020490022366084, "ground_truth": 0}, {"key": "39028348", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.008124709200309901, "ground_truth": 0}, {"key": "37459383", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.030850508646934352, "ground_truth": 0}, {"key": "37459383", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.014199679285849774, "ground_truth": 0}, {"key": "37459383", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03210070780724817, "ground_truth": 0}, {"key": "37459383", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.015365340216863574, "ground_truth": 0}, {"key": "37459383", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.029873091492951885, "ground_truth": 0}, {"key": "34020070", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03044434956997365, "ground_truth": 0}, {"key": "34020070", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04193052469317393, "ground_truth": 0}, {"key": "34020070", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13206615374788672, "ground_truth": 0}, {"key": "34020070", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.035012626488269916, "ground_truth": 0}, {"key": "34020070", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03474962585822279, "ground_truth": 0}, {"key": "35176615", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05419873285995708, "ground_truth": 0}, {"key": "35176615", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08509904357491015, "ground_truth": 0}, {"key": "35176615", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07423136925573642, "ground_truth": 0}, {"key": "35176615", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.018761083986466472, "ground_truth": 0}, {"key": "35176615", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05541279179702083, "ground_truth": 0}, {"key": "33296389", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.21601152621157627, "ground_truth": 0}, {"key": "33296389", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2240554585188223, "ground_truth": 0}, {"key": "33296389", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0685374935088957, "ground_truth": 0}, {"key": "33296389", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11279539712020067, "ground_truth": 0}, {"key": "33296389", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05033063054908875, "ground_truth": 0}, {"key": "35399504", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2094696952418066, "ground_truth": 0}, {"key": "35399504", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16776334756962585, "ground_truth": 0}, {"key": "35399504", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3575675144227902, "ground_truth": 0}, {"key": "35399504", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223189144176898, "ground_truth": 0}, {"key": "35399504", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2538610156349853, "ground_truth": 0}, {"key": "34807886", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07081620204013687, "ground_truth": 0}, {"key": "34807886", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04099902811197142, "ground_truth": 0}, {"key": "34807886", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10052486815925397, "ground_truth": 0}, {"key": "34807886", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12635334341876317, "ground_truth": 0}, {"key": "34807886", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04401865622794717, "ground_truth": 0}, {"key": "37629813", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.30902370460389145, "ground_truth": 0}, {"key": "37629813", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2393493404888186, "ground_truth": 0}, {"key": "37629813", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17441027100159562, "ground_truth": 0}, {"key": "37629813", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653333819286075, "ground_truth": 0}, {"key": "37629813", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3106943882647774, "ground_truth": 0}, {"key": "28084389", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04369105819043593, "ground_truth": 0}, {"key": "28084389", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.32252599719027947, "ground_truth": 0}, {"key": "28084389", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1772405168012787, "ground_truth": 0}, {"key": "28084389", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16721866383870163, "ground_truth": 0}, {"key": "28084389", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15610490275625952, "ground_truth": 0}, {"key": "35391734", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "35391734", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.37022538905882896, "ground_truth": 0}, {"key": "35391734", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3345894310154113, "ground_truth": 0}, {"key": "35391734", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.41489882755967217, "ground_truth": 0}, {"key": "35391734", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165105388159, "ground_truth": 0}, {"key": "40214591", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1356895435791109, "ground_truth": 0}, {"key": "40214591", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0742313690306958, "ground_truth": 0}, {"key": "40214591", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10087861994615152, "ground_truth": 0}, {"key": "40214591", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16026603757527041, "ground_truth": 0}, {"key": "40214591", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.27512971231175337, "ground_truth": 0}, {"key": "26283171", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.037047171035621364, "ground_truth": 0}, {"key": "26283171", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.031738588974503684, "ground_truth": 0}, {"key": "26283171", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02333076791785132, "ground_truth": 0}, {"key": "26283171", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.022802637826358, "ground_truth": 0}, {"key": "26283171", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02822098773861864, "ground_truth": 0}, {"key": "37084030", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16238002317578773, "ground_truth": 0}, {"key": "37084030", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2227001368755288, "ground_truth": 0}, {"key": "37084030", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13753247281670625, "ground_truth": 0}, {"key": "37084030", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561504645566578, "ground_truth": 0}, {"key": "37084030", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19072402689316276, "ground_truth": 0}, {"key": "39027295", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.021781171761612296, "ground_truth": 0}, {"key": "39027295", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.044348580566366876, "ground_truth": 0}, {"key": "39027295", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.044680872968255, "ground_truth": 0}, {"key": "39027295", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06512754742383327, "ground_truth": 0}, {"key": "39027295", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.029535338055185753, "ground_truth": 0}, {"key": "14018647", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05582313837473312, "ground_truth": 0}, {"key": "14018647", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.025371311139526922, "ground_truth": 0}, {"key": "14018647", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.034880886906637466, "ground_truth": 0}, {"key": "14018647", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.025760559093219556, "ground_truth": 0}, {"key": "14018647", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.041152889554226094, "ground_truth": 0}, {"key": "37424289", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06371499321590617, "ground_truth": 0}, {"key": "37424289", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09534946259313544, "ground_truth": 0}, {"key": "37424289", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0824015048072881, "ground_truth": 0}, {"key": "37424289", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07159120441718796, "ground_truth": 0}, {"key": "37424289", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08181271312238414, "ground_truth": 0}, {"key": "37498031", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0980793201589129, "ground_truth": 0}, {"key": "37498031", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1276526254483068, "ground_truth": 0}, {"key": "37498031", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20181322481230976, "ground_truth": 0}, {"key": "37498031", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16026602326604722, "ground_truth": 0}, {"key": "37498031", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.160266041326737, "ground_truth": 0}, {"key": "30104095", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.045352577558531865, "ground_truth": 0}, {"key": "30104095", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10302442172947096, "ground_truth": 0}, {"key": "30104095", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.125922771390418, "ground_truth": 0}, {"key": "30104095", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04084571723990722, "ground_truth": 0}, {"key": "30104095", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13660839810074538, "ground_truth": 0}, {"key": "37911407", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16026603152569446, "ground_truth": 0}, {"key": "37911407", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3174262877891666, "ground_truth": 0}, {"key": "37911407", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14511535555053323, "ground_truth": 0}, {"key": "37911407", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14755518801709686, "ground_truth": 0}, {"key": "37911407", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08756384544174727, "ground_truth": 0}, {"key": "39177472", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.021368888732297316, "ground_truth": 0}, {"key": "39177472", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.008916127014677803, "ground_truth": 0}, {"key": "39177472", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.013480103115154397, "ground_truth": 0}, {"key": "39177472", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.021125193941641824, "ground_truth": 0}, {"key": "39177472", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.020023441676048158, "ground_truth": 0}, {"key": "32325454", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09602549218009607, "ground_truth": 0}, {"key": "32325454", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05623634810831007, "ground_truth": 0}, {"key": "32325454", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03608394113416866, "ground_truth": 0}, {"key": "32325454", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07751766070088428, "ground_truth": 0}, {"key": "32325454", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12252321733211075, "ground_truth": 0}, {"key": "38395319", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11516223199228326, "ground_truth": 0}, {"key": "38395319", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.047780069386338775, "ground_truth": 0}, {"key": "38395319", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04208773000440265, "ground_truth": 0}, {"key": "38395319", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0680404246906971, "ground_truth": 0}, {"key": "38395319", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.029201292159070566, "ground_truth": 0}, {"key": "38235895", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02025469145709459, "ground_truth": 0}, {"key": "38235895", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5039061519065637, "ground_truth": 0}, {"key": "38235895", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05340333365049873, "ground_truth": 0}, {"key": "38235895", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06465348980954728, "ground_truth": 0}, {"key": "38235895", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04535258001999872, "ground_truth": 0}, {"key": "26543267", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.33633103895854705, "ground_truth": 0}, {"key": "26543267", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22000710638292093, "ground_truth": 0}, {"key": "26543267", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12765261465292133, "ground_truth": 0}, {"key": "26543267", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19682620920553476, "ground_truth": 0}, {"key": "26543267", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14033625452846332, "ground_truth": 0}, {"key": "39054728", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.789882763279146, "ground_truth": 0}, {"key": "39054728", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8255897229594015, "ground_truth": 0}, {"key": "39054728", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8688267767585495, "ground_truth": 0}, {"key": "39054728", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9136765178720303, "ground_truth": 0}, {"key": "39054728", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392854125437, "ground_truth": 0}, {"key": "39158443", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04742587323187115, "ground_truth": 0}, {"key": "39158443", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "39158443", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07585817821442899, "ground_truth": 0}, {"key": "39158443", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2200070866899359, "ground_truth": 0}, {"key": "39158443", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3242353914342666, "ground_truth": 0}, {"key": "36254201", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.028652669605254963, "ground_truth": 0}, {"key": "36254201", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.017576884306970464, "ground_truth": 0}, {"key": "36254201", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04054073597342291, "ground_truth": 0}, {"key": "36254201", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.016090873773973457, "ground_truth": 0}, {"key": "36254201", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06903792967116533, "ground_truth": 0}, {"key": "23434347", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05203782569788038, "ground_truth": 0}, {"key": "23434347", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.007725534404777524, "ground_truth": 0}, {"key": "23434347", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03949040433835939, "ground_truth": 0}, {"key": "23434347", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05184547148645377, "ground_truth": 0}, {"key": "23434347", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08449275615067021, "ground_truth": 0}, {"key": "34397620", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.036493769022468606, "ground_truth": 0}, {"key": "34397620", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0097461040451291, "ground_truth": 0}, {"key": "34397620", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.008093290215534307, "ground_truth": 0}, {"key": "34397620", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04023794575238801, "ground_truth": 0}, {"key": "34397620", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.00251146382932732, "ground_truth": 0}, {"key": "34340916", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12678517833268055, "ground_truth": 0}, {"key": "34340916", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03622005770562124, "ground_truth": 0}, {"key": "34340916", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15203225123465833, "ground_truth": 0}, {"key": "34340916", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09203286403389546, "ground_truth": 0}, {"key": "34340916", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07751765466355234, "ground_truth": 0}, {"key": "30375089", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02048855386692261, "ground_truth": 0}, {"key": "30375089", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.033085977796418205, "ground_truth": 0}, {"key": "30375089", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05582314289567183, "ground_truth": 0}, {"key": "30375089", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03185885666197956, "ground_truth": 0}, {"key": "30375089", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024237635295515318, "ground_truth": 0}, {"key": "35807797", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.017309097335184487, "ground_truth": 0}, {"key": "35807797", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.015663648503835854, "ground_truth": 0}, {"key": "35807797", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.031026179122774313, "ground_truth": 0}, {"key": "35807797", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.032589743262613574, "ground_truth": 0}, {"key": "35807797", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.023419945850664238, "ground_truth": 0}, {"key": "34188172", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04922211542489974, "ground_truth": 0}, {"key": "34188172", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08479540955258374, "ground_truth": 0}, {"key": "34188172", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10123348262517771, "ground_truth": 0}, {"key": "34188172", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05460060598784161, "ground_truth": 0}, {"key": "34188172", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07316472081131128, "ground_truth": 0}, {"key": "37075567", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1470645266045934, "ground_truth": 0}, {"key": "37075567", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08389038710166953, "ground_truth": 0}, {"key": "37075567", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22000708910612457, "ground_truth": 0}, {"key": "37075567", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08977329494283201, "ground_truth": 0}, {"key": "37075567", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15921740262714384, "ground_truth": 0}, {"key": "35559735", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09739040061113592, "ground_truth": 0}, {"key": "35559735", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09534945694736316, "ground_truth": 0}, {"key": "35559735", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.062331034694502574, "ground_truth": 0}, {"key": "35559735", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08756384018110927, "ground_truth": 0}, {"key": "35559735", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10669060319552227, "ground_truth": 0}, {"key": "33005019", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03978780867808957, "ground_truth": 0}, {"key": "33005019", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.010944576990907942, "ground_truth": 0}, {"key": "33005019", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01934510360165992, "ground_truth": 0}, {"key": "33005019", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08181271081795992, "ground_truth": 0}, {"key": "33005019", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.041617796953154575, "ground_truth": 0}, {"key": "30808252", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08329192283607474, "ground_truth": 0}, {"key": "30808252", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09268777428238778, "ground_truth": 0}, {"key": "30808252", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06754669489876172, "ground_truth": 0}, {"key": "30808252", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09602549575965737, "ground_truth": 0}, {"key": "30808252", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17106119007440346, "ground_truth": 0}, {"key": "15159017", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02169809935760122, "ground_truth": 0}, {"key": "15159017", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06278920996337495, "ground_truth": 0}, {"key": "15159017", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.027066174890745164, "ground_truth": 0}, {"key": "15159017", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06754669234043767, "ground_truth": 0}, {"key": "15159017", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03102617981328514, "ground_truth": 0}, {"key": "24493400", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.35398630731043057, "ground_truth": 0}, {"key": "24493400", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.48828340487068983, "ground_truth": 0}, {"key": "24493400", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4282333981679986, "ground_truth": 0}, {"key": "24493400", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4941408767396617, "ground_truth": 0}, {"key": "24493400", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408896922099, "ground_truth": 0}, {"key": "37791071", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07807815939035366, "ground_truth": 0}, {"key": "37791071", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07696083997877569, "ground_truth": 0}, {"key": "37791071", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13753247416666478, "ground_truth": 0}, {"key": "37791071", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2628418565516346, "ground_truth": 0}, {"key": "37791071", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15507847105822647, "ground_truth": 0}, {"key": "33528627", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07640767975412616, "ground_truth": 0}, {"key": "33528627", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07892587892819995, "ground_truth": 0}, {"key": "33528627", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06730107702839484, "ground_truth": 0}, {"key": "33528627", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11920292185421369, "ground_truth": 0}, {"key": "33528627", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14755518373087942, "ground_truth": 0}, {"key": "39925662", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10594828033501083, "ground_truth": 0}, {"key": "39925662", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.060529388769481426, "ground_truth": 0}, {"key": "39925662", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.055617609653546035, "ground_truth": 0}, {"key": "39925662", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03718677511825495, "ground_truth": 0}, {"key": "39925662", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.038610930302666886, "ground_truth": 0}, {"key": "29213416", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19314737511041571, "ground_truth": 0}, {"key": "29213416", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09334687265831927, "ground_truth": 0}, {"key": "29213416", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21206880115250085, "ground_truth": 0}, {"key": "29213416", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09009299919821641, "ground_truth": 0}, {"key": "29213416", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24798744469121026, "ground_truth": 0}, {"key": "34492745", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.010860331633444754, "ground_truth": 0}, {"key": "34492745", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0030278351191508675, "ground_truth": 0}, {"key": "34492745", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.007066401120975316, "ground_truth": 0}, {"key": "34492745", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02245705601790341, "ground_truth": 0}, {"key": "34492745", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.016979990953842075, "ground_truth": 0}, {"key": "34191937", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.045352579873637854, "ground_truth": 0}, {"key": "34191937", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03775027516096996, "ground_truth": 0}, {"key": "34191937", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10017222358654068, "ground_truth": 0}, {"key": "34191937", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.036083941472452606, "ground_truth": 0}, {"key": "34191937", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04603389863595503, "ground_truth": 0}, {"key": "34933372", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.055617612675466936, "ground_truth": 0}, {"key": "34933372", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0173756656098781, "ground_truth": 0}, {"key": "34933372", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.061875985630864244, "ground_truth": 0}, {"key": "34933372", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07133199677036164, "ground_truth": 0}, {"key": "34933372", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11085559735683795, "ground_truth": 0}, {"key": "38714379", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24580846491185823, "ground_truth": 0}, {"key": "38714379", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2173375172364734, "ground_truth": 0}, {"key": "38714379", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.186539227744873, "ground_truth": 0}, {"key": "38714379", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1505276201254797, "ground_truth": 0}, {"key": "38714379", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.148047183882611, "ground_truth": 0}, {"key": "39220660", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08945460043448303, "ground_truth": 0}, {"key": "39220660", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16238002211802183, "ground_truth": 0}, {"key": "39220660", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19498022666909273, "ground_truth": 0}, {"key": "39220660", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09073548182980086, "ground_truth": 0}, {"key": "39220660", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13477592510208666, "ground_truth": 0}, {"key": "41028780", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.049039619577074436, "ground_truth": 0}, {"key": "41028780", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.010448625814660365, "ground_truth": 0}, {"key": "41028780", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0124797005445097, "ground_truth": 0}, {"key": "41028780", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05223085425938881, "ground_truth": 0}, {"key": "41028780", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.033589508872801085, "ground_truth": 0}, {"key": "39457108", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.013376604489981021, "ground_truth": 0}, {"key": "39457108", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.002981032868189697, "ground_truth": 0}, {"key": "39457108", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01685007835076377, "ground_truth": 0}, {"key": "39457108", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.016029147668366474, "ground_truth": 0}, {"key": "39457108", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.016657039842092033, "ground_truth": 0}, {"key": "38288018", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4349412497863792, "ground_truth": 0}, {"key": "38288018", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.44552952798758777, "ground_truth": 0}, {"key": "38288018", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.40544871329804777, "ground_truth": 0}, {"key": "38288018", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.30404167054883713, "ground_truth": 0}, {"key": "38288018", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473403897679, "ground_truth": 0}, {"key": "40106293", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.025760561606859498, "ground_truth": 0}, {"key": "40106293", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13568954663690352, "ground_truth": 0}, {"key": "40106293", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.030675800203915173, "ground_truth": 0}, {"key": "40106293", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.039787806952787, "ground_truth": 0}, {"key": "40106293", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02898062833366883, "ground_truth": 0}, {"key": "39948797", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.051462763127567805, "ground_truth": 0}, {"key": "39948797", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10743747371341401, "ground_truth": 0}, {"key": "39948797", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10970577286880481, "ground_truth": 0}, {"key": "39948797", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10818895536701398, "ground_truth": 0}, {"key": "39948797", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07107367053795562, "ground_truth": 0}, {"key": "31853399", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.049222118446068795, "ground_truth": 0}, {"key": "31853399", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.033211170393097775, "ground_truth": 0}, {"key": "31853399", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05561761245672891, "ground_truth": 0}, {"key": "31853399", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13341521628197464, "ground_truth": 0}, {"key": "31853399", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04161779381789832, "ground_truth": 0}, {"key": "35273252", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3566707061668449, "ground_truth": 0}, {"key": "35273252", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2829881198502087, "ground_truth": 0}, {"key": "35273252", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25091277714164995, "ground_truth": 0}, {"key": "35273252", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12852514381513533, "ground_truth": 0}, {"key": "35273252", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2575782741638082, "ground_truth": 0}, {"key": "37130459", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7772998507821508, "ground_truth": 0}, {"key": "37130459", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8238958757405694, "ground_truth": 0}, {"key": "37130459", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7931059430451463, "ground_truth": 0}, {"key": "37130459", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8692713126793717, "ground_truth": 0}, {"key": "37130459", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346161997549, "ground_truth": 0}, {"key": "21734003", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02423763454093048, "ground_truth": 0}, {"key": "21734003", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12765261963751562, "ground_truth": 0}, {"key": "21734003", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09877259249818443, "ground_truth": 0}, {"key": "21734003", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05033063376313446, "ground_truth": 0}, {"key": "21734003", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.025371310586744106, "ground_truth": 0}, {"key": "33990737", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.013636836347511633, "ground_truth": 0}, {"key": "33990737", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.016277460434993903, "ground_truth": 0}, {"key": "33990737", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010408314753008175, "ground_truth": 0}, {"key": "33990737", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01840489037355835, "ground_truth": 0}, {"key": "33990737", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.034100425088826936, "ground_truth": 0}, {"key": "34559912", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05379964300956024, "ground_truth": 0}, {"key": "34559912", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05184546864564626, "ground_truth": 0}, {"key": "34559912", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.046033900888658726, "ground_truth": 0}, {"key": "34559912", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.054399318506606315, "ground_truth": 0}, {"key": "34559912", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06097518344806936, "ground_truth": 0}, {"key": "39820439", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05340333430154073, "ground_truth": 0}, {"key": "39820439", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.030214587715595726, "ground_truth": 0}, {"key": "39820439", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08694166205778564, "ground_truth": 0}, {"key": "39820439", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08151974906590198, "ground_truth": 0}, {"key": "39820439", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15817434345980647, "ground_truth": 0}, {"key": "34759328", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.057493275026550855, "ground_truth": 0}, {"key": "34759328", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1403362589338965, "ground_truth": 0}, {"key": "34759328", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04672495623288704, "ground_truth": 0}, {"key": "34759328", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14903529661003112, "ground_truth": 0}, {"key": "34759328", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13432104637893616, "ground_truth": 0}, {"key": "36939137", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23510839020844354, "ground_truth": 0}, {"key": "36939137", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2751297209113454, "ground_truth": 0}, {"key": "36939137", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4301473597084389, "ground_truth": 0}, {"key": "36939137", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.34158250450756045, "ground_truth": 0}, {"key": "36939137", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4320633863847447, "ground_truth": 0}, {"key": "35851522", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.018264278444937443, "ground_truth": 0}, {"key": "35851522", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03803509529571026, "ground_truth": 0}, {"key": "35851522", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.044348579223701855, "ground_truth": 0}, {"key": "35851522", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04958902343464797, "ground_truth": 0}, {"key": "35851522", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.013325148403409658, "ground_truth": 0}, {"key": "22412782", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09982065925375236, "ground_truth": 0}, {"key": "22412782", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10706345607753219, "ground_truth": 0}, {"key": "22412782", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05165378456969184, "ground_truth": 0}, {"key": "22412782", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11162799197692674, "ground_truth": 0}, {"key": "22412782", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220563705016407, "ground_truth": 0}, {"key": "38579227", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3363310460277865, "ground_truth": 0}, {"key": "38579227", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.236516247748348, "ground_truth": 0}, {"key": "38579227", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19930801116528413, "ground_truth": 0}, {"key": "38579227", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3345894316102553, "ground_truth": 0}, {"key": "38579227", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.25683200397755596, "ground_truth": 0}, {"key": "37206995", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16291204397665637, "ground_truth": 0}, {"key": "37206995", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3593641436387997, "ground_truth": 0}, {"key": "37206995", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22270014071491273, "ground_truth": 0}, {"key": "37206995", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24364246356922675, "ground_truth": 0}, {"key": "37206995", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.31405055459685827, "ground_truth": 0}, {"key": "38700847", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7279754794212081, "ground_truth": 0}, {"key": "38700847", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13660840046881767, "ground_truth": 0}, {"key": "38700847", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5755879832180594, "ground_truth": 0}, {"key": "38700847", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093790366407, "ground_truth": 0}, {"key": "38700847", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764820010511, "ground_truth": 0}, {"key": "20246590", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8962513684563457, "ground_truth": 0}, {"key": "20246590", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.879146773198907, "ground_truth": 0}, {"key": "20246590", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8169911607813956, "ground_truth": 0}, {"key": "20246590", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9230391641292288, "ground_truth": 0}, {"key": "20246590", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7000752659967485, "ground_truth": 0}, {"key": "39141360", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22815651386369057, "ground_truth": 0}, {"key": "39141360", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11047115072712851, "ground_truth": 0}, {"key": "39141360", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16995624301374063, "ground_truth": 0}, {"key": "39141360", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.40922078736058926, "ground_truth": 0}, {"key": "39141360", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14223189354393873, "ground_truth": 0}, {"key": "37906226", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13660839833622965, "ground_truth": 0}, {"key": "37906226", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02153287743720034, "ground_truth": 0}, {"key": "37906226", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04637821138634136, "ground_truth": 0}, {"key": "37906226", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03963884108956529, "ground_truth": 0}, {"key": "37906226", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.027480693230466157, "ground_truth": 0}, {"key": "16201033", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.008348054335633218, "ground_truth": 0}, {"key": "16201033", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.024516336640737997, "ground_truth": 0}, {"key": "16201033", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.018546565519754, "ground_truth": 0}, {"key": "16201033", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.006438102523438727, "ground_truth": 0}, {"key": "16201033", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.018124721423831078, "ground_truth": 0}, {"key": "36469022", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04778006817301108, "ground_truth": 0}, {"key": "36469022", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.013171950685498361, "ground_truth": 0}, {"key": "36469022", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010944577558233404, "ground_truth": 0}, {"key": "36469022", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.018833130429848494, "ground_truth": 0}, {"key": "36469022", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.022542967023378012, "ground_truth": 0}, {"key": "31295270", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07133200318332443, "ground_truth": 0}, {"key": "31295270", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.29017561882935805, "ground_truth": 0}, {"key": "31295270", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.147064532458419, "ground_truth": 0}, {"key": "31295270", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21866938567249125, "ground_truth": 0}, {"key": "31295270", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09401018596216935, "ground_truth": 0}, {"key": "35360689", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.028544152267974646, "ground_truth": 0}, {"key": "35360689", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0057302471711111625, "ground_truth": 0}, {"key": "35360689", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0035243411792189824, "ground_truth": 0}, {"key": "35360689", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0044683847197353145, "ground_truth": 0}, {"key": "35360689", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.009746103663515289, "ground_truth": 0}, {"key": "29202793", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09501304571830926, "ground_truth": 0}, {"key": "29202793", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1721718525034493, "ground_truth": 0}, {"key": "29202793", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06779313874083784, "ground_truth": 0}, {"key": "29202793", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0946777012405971, "ground_truth": 0}, {"key": "29202793", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.061875987422813535, "ground_truth": 0}, {"key": "35999008", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014957086390379945, "ground_truth": 0}, {"key": "35999008", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.012576348237781884, "ground_truth": 0}, {"key": "35999008", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01730909700597677, "ground_truth": 0}, {"key": "35999008", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.022802637161258323, "ground_truth": 0}, {"key": "35999008", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012821214131065982, "ground_truth": 0}, {"key": "31797119", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16559311930318205, "ground_truth": 0}, {"key": "31797119", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0616496193496721, "ground_truth": 0}, {"key": "31797119", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16451645473572815, "ground_truth": 0}, {"key": "31797119", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14128141513288542, "ground_truth": 0}, {"key": "31797119", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10374862787659327, "ground_truth": 0}, {"key": "26711893", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1250653878265081, "ground_truth": 0}, {"key": "26711893", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.041152887453940565, "ground_truth": 0}, {"key": "26711893", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2991052042906592, "ground_truth": 0}, {"key": "26711893", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10447732004172468, "ground_truth": 0}, {"key": "26711893", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0863234802278526, "ground_truth": 0}, {"key": "35348288", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.012431650484276257, "ground_truth": 0}, {"key": "35348288", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.017917344732318406, "ground_truth": 0}, {"key": "35348288", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010735162611556423, "ground_truth": 0}, {"key": "35348288", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.017242776445139607, "ground_truth": 0}, {"key": "35348288", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024798161666191906, "ground_truth": 0}, {"key": "38124131", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03541072983588309, "ground_truth": 0}, {"key": "38124131", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.024798159872033286, "ground_truth": 0}, {"key": "38124131", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.026255300089736748, "ground_truth": 0}, {"key": "38124131", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.016850079124047818, "ground_truth": 0}, {"key": "38124131", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757214023036261, "ground_truth": 0}, {"key": "20285901", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1470645303019328, "ground_truth": 0}, {"key": "20285901", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1490353009689827, "ground_truth": 0}, {"key": "20285901", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2133771681844449, "ground_truth": 0}, {"key": "20285901", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4707365997298913, "ground_truth": 0}, {"key": "20285901", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416730021915335, "ground_truth": 0}, {"key": "35633632", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08093671431297517, "ground_truth": 0}, {"key": "35633632", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06853749276810522, "ground_truth": 0}, {"key": "35633632", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05623634636341082, "ground_truth": 0}, {"key": "35633632", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0035796425288283588, "ground_truth": 0}, {"key": "35633632", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1772405258419372, "ground_truth": 0}, {"key": "10741274", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6893056050394482, "ground_truth": 0}, {"key": "10741274", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.84389509796671, "ground_truth": 0}, {"key": "10741274", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7371581569881493, "ground_truth": 0}, {"key": "10741274", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.906653121707592, "ground_truth": 0}, {"key": "10741274", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.453261854054475, "ground_truth": 0}, {"key": "30605795", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12852513329463172, "ground_truth": 0}, {"key": "30605795", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1167640129390875, "ground_truth": 0}, {"key": "30605795", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07640768399568272, "ground_truth": 0}, {"key": "30605795", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17106118038642074, "ground_truth": 0}, {"key": "30605795", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15921740075735002, "ground_truth": 0}, {"key": "30539722", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14903530428006878, "ground_truth": 0}, {"key": "30539722", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18242553232954978, "ground_truth": 0}, {"key": "30539722", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09602549164399204, "ground_truth": 0}, {"key": "30539722", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07751766129764254, "ground_truth": 0}, {"key": "30539722", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.290980865686899, "ground_truth": 0}, {"key": "18639299", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16184942838647706, "ground_truth": 0}, {"key": "18639299", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07185126609152338, "ground_truth": 0}, {"key": "18639299", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07343005077470449, "ground_truth": 0}, {"key": "18639299", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1613202363817047, "ground_truth": 0}, {"key": "18639299", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0869416620329357, "ground_truth": 0}, {"key": "39773552", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12549345435537235, "ground_truth": 0}, {"key": "39773552", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14128141730834384, "ground_truth": 0}, {"key": "39773552", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08850466586568745, "ground_truth": 0}, {"key": "39773552", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08882029005559117, "ground_truth": 0}, {"key": "39773552", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09534946563801497, "ground_truth": 0}, {"key": "34086410", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08151975004894292, "ground_truth": 0}, {"key": "34086410", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.017848737479228667, "ground_truth": 0}, {"key": "34086410", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.043528141020033884, "ground_truth": 0}, {"key": "34086410", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.018546564637137414, "ground_truth": 0}, {"key": "34086410", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.048316069232183574, "ground_truth": 0}, {"key": "35454652", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.028220986091804737, "ground_truth": 0}, {"key": "35454652", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04240382842836395, "ground_truth": 0}, {"key": "35454652", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.012147171461338886, "ground_truth": 0}, {"key": "35454652", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03321117028386956, "ground_truth": 0}, {"key": "35454652", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03581319385536625, "ground_truth": 0}, {"key": "36158310", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03333682459905123, "ground_truth": 0}, {"key": "36158310", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.013480103898661522, "ground_truth": 0}, {"key": "36158310", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.059428218808102375, "ground_truth": 0}, {"key": "36158310", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.028220986817874487, "ground_truth": 0}, {"key": "36158310", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.037892425121669564, "ground_truth": 0}, {"key": "35688387", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014392337028333878, "ground_truth": 0}, {"key": "35688387", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07779745218079173, "ground_truth": 0}, {"key": "35688387", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.022715756149476483, "ground_truth": 0}, {"key": "35688387", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03222229796669259, "ground_truth": 0}, {"key": "35688387", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03138043031133139, "ground_truth": 0}, {"key": "34209292", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22609940128163789, "ground_truth": 0}, {"key": "34209292", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.061649619553264604, "ground_truth": 0}, {"key": "34209292", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13799646728481307, "ground_truth": 0}, {"key": "34209292", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07107366353239414, "ground_truth": 0}, {"key": "34209292", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07343005372874356, "ground_truth": 0}, {"key": "25037859", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.029760093326204613, "ground_truth": 0}, {"key": "25037859", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07807815899219558, "ground_truth": 0}, {"key": "25037859", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10017221837403617, "ground_truth": 0}, {"key": "25037859", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04385456583067515, "ground_truth": 0}, {"key": "25037859", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04038906885940737, "ground_truth": 0}, {"key": "36412121", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.051845470145388824, "ground_truth": 0}, {"key": "36412121", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.027901376763770382, "ground_truth": 0}, {"key": "36412121", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01704531692729027, "ground_truth": 0}, {"key": "36412121", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0446808730171076, "ground_truth": 0}, {"key": "36412121", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02576056025266447, "ground_truth": 0}, {"key": "34909172", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11201595982900184, "ground_truth": 0}, {"key": "34909172", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.25534365093015554, "ground_truth": 0}, {"key": "34909172", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1089450410952185, "ground_truth": 0}, {"key": "34909172", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.247987440499188, "ground_truth": 0}, {"key": "34909172", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13386749629121203, "ground_truth": 0}, {"key": "39011806", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23022675741792267, "ground_truth": 0}, {"key": "39011806", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5736784263215737, "ground_truth": 0}, {"key": "39011806", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5078118772718878, "ground_truth": 0}, {"key": "39011806", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5917232449182147, "ground_truth": 0}, {"key": "39011806", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.33633105972772737, "ground_truth": 0}, {"key": "33096163", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2877678136382741, "ground_truth": 0}, {"key": "33096163", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09334687596989165, "ground_truth": 0}, {"key": "33096163", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15713686048595296, "ground_truth": 0}, {"key": "33096163", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.111241217134779, "ground_truth": 0}, {"key": "33096163", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09073549111455745, "ground_truth": 0}, {"key": "38762205", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02790137656069319, "ground_truth": 0}, {"key": "38762205", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026657740536349395, "ground_truth": 0}, {"key": "38762205", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.043204030626175526, "ground_truth": 0}, {"key": "38762205", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07185127087304635, "ground_truth": 0}, {"key": "38762205", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04434858188208507, "ground_truth": 0}, {"key": "35519177", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05165378614734072, "ground_truth": 0}, {"key": "35519177", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01778039007244977, "ground_truth": 0}, {"key": "35519177", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06052939033085699, "ground_truth": 0}, {"key": "35519177", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05602938436475853, "ground_truth": 0}, {"key": "35519177", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09670578662877787, "ground_truth": 0}, {"key": "36192531", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11124120896578989, "ground_truth": 0}, {"key": "36192531", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18242552590556366, "ground_truth": 0}, {"key": "36192531", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06233103941037565, "ground_truth": 0}, {"key": "36192531", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.39981165168271926, "ground_truth": 0}, {"key": "36192531", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.27669054460023235, "ground_truth": 0}, {"key": "33160852", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.36840571261129473, "ground_truth": 0}, {"key": "33160852", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7641884218967595, "ground_truth": 0}, {"key": "33160852", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.542863271059041, "ground_truth": 0}, {"key": "33160852", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.45229400228101607, "ground_truth": 0}, {"key": "33160852", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984286808498, "ground_truth": 0}, {"key": "36312304", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06325052227500468, "ground_truth": 0}, {"key": "36312304", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06804041952951247, "ground_truth": 0}, {"key": "36312304", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.054198728195495365, "ground_truth": 0}, {"key": "36312304", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.011687256834493101, "ground_truth": 0}, {"key": "36312304", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07585818035340613, "ground_truth": 0}, {"key": "33773343", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08819004662012336, "ground_truth": 0}, {"key": "33773343", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1074374702609075, "ground_truth": 0}, {"key": "33773343", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.043691057564812154, "ground_truth": 0}, {"key": "33773343", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0809367140268341, "ground_truth": 0}, {"key": "33773343", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.058776561599332686, "ground_truth": 0}, {"key": "34913320", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.040845720110241346, "ground_truth": 0}, {"key": "34913320", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02585877638370227, "ground_truth": 0}, {"key": "34913320", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.039937315582160356, "ground_truth": 0}, {"key": "34913320", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.047425873203262456, "ground_truth": 0}, {"key": "34913320", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1530421555490187, "ground_truth": 0}, {"key": "33784155", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1015894513243372, "ground_truth": 0}, {"key": "33784155", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12808823983846968, "ground_truth": 0}, {"key": "33784155", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11920291457357034, "ground_truth": 0}, {"key": "33784155", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06560483138742898, "ground_truth": 0}, {"key": "33784155", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0987725901674481, "ground_truth": 0}, {"key": "24085062", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.747615980821931, "ground_truth": 0}, {"key": "24085062", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.661922887153361, "ground_truth": 0}, {"key": "24085062", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7264256212614664, "ground_truth": 0}, {"key": "24085062", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346225131631, "ground_truth": 0}, {"key": "24085062", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191338257634, "ground_truth": 0}, {"key": "33893487", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.004810983139463123, "ground_truth": 0}, {"key": "33893487", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0029121781408147493, "ground_truth": 0}, {"key": "33893487", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.023689471123327165, "ground_truth": 0}, {"key": "33893487", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0036928528186152606, "ground_truth": 0}, {"key": "33893487", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0058881592690269244, "ground_truth": 0}, {"key": "40913011", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10338596346666999, "ground_truth": 0}, {"key": "40913011", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09534945971258148, "ground_truth": 0}, {"key": "40913011", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08240150896630054, "ground_truth": 0}, {"key": "40913011", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11279540030950572, "ground_truth": 0}, {"key": "40913011", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0558231407766078, "ground_truth": 0}, {"key": "29642545", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.286169265376639, "ground_truth": 0}, {"key": "29642545", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1320661549209859, "ground_truth": 0}, {"key": "29642545", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09203286004634902, "ground_truth": 0}, {"key": "29642545", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21337716154721043, "ground_truth": 0}, {"key": "29642545", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1225232103247894, "ground_truth": 0}, {"key": "35969159", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2689414338007653, "ground_truth": 0}, {"key": "35969159", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12678516625769334, "ground_truth": 0}, {"key": "35969159", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06560483395065837, "ground_truth": 0}, {"key": "35969159", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15002882524256936, "ground_truth": 0}, {"key": "35969159", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07921032064823916, "ground_truth": 0}, {"key": "37081669", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.019719127846806624, "ground_truth": 0}, {"key": "37081669", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.104843366001405, "ground_truth": 0}, {"key": "37081669", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06903793010440032, "ground_truth": 0}, {"key": "37081669", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12808824947673036, "ground_truth": 0}, {"key": "37081669", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08819004778252881, "ground_truth": 0}, {"key": "40048022", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03308597938155548, "ground_truth": 0}, {"key": "40048022", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17895589610389911, "ground_truth": 0}, {"key": "40048022", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04885778073006128, "ground_truth": 0}, {"key": "40048022", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05541279378109528, "ground_truth": 0}, {"key": "40048022", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.042087729456484944, "ground_truth": 0}, {"key": "32884004", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1417559966580212, "ground_truth": 0}, {"key": "32884004", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.161849423759401, "ground_truth": 0}, {"key": "32884004", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0991208541260019, "ground_truth": 0}, {"key": "32884004", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04778007044556747, "ground_truth": 0}, {"key": "32884004", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05877655725961205, "ground_truth": 0}, {"key": "39022490", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.36477756649259313, "ground_truth": 0}, {"key": "39022490", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.46490159273773063, "ground_truth": 0}, {"key": "39022490", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5888891366407586, "ground_truth": 0}, {"key": "39022490", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4474603025121934, "ground_truth": 0}, {"key": "39022490", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2958398859127721, "ground_truth": 0}, {"key": "35159385", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.010368156768254061, "ground_truth": 0}, {"key": "35159385", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01826427830234427, "ground_truth": 0}, {"key": "35159385", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.011244560645326012, "ground_truth": 0}, {"key": "35159385", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.020645931069776448, "ground_truth": 0}, {"key": "35159385", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.018264277990918187, "ground_truth": 0}, {"key": "34363669", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03185885730779709, "ground_truth": 0}, {"key": "34363669", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.017045317294284615, "ground_truth": 0}, {"key": "34363669", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.028652669921563637, "ground_truth": 0}, {"key": "34363669", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04069295342538302, "ground_truth": 0}, {"key": "34363669", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.019124038477883378, "ground_truth": 0}, {"key": "36119687", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07477004725924342, "ground_truth": 0}, {"key": "36119687", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.047602657862979215, "ground_truth": 0}, {"key": "36119687", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12421300290242895, "ground_truth": 0}, {"key": "36119687", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10230470372584417, "ground_truth": 0}, {"key": "36119687", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18359363093640985, "ground_truth": 0}, {"key": "35217446", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.011201214097142668, "ground_truth": 0}, {"key": "35217446", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05165378313797854, "ground_truth": 0}, {"key": "35217446", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010408314571384233, "ground_truth": 0}, {"key": "35217446", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01186912101084743, "ground_truth": 0}, {"key": "35217446", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03044434924122879, "ground_truth": 0}, {"key": "39049331", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11516223395497405, "ground_truth": 0}, {"key": "39049331", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20689405601082037, "ground_truth": 0}, {"key": "39049331", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11476477612931611, "ground_truth": 0}, {"key": "39049331", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07396337330703541, "ground_truth": 0}, {"key": "39049331", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3073580130448362, "ground_truth": 0}, {"key": "36472242", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.046724955436315954, "ground_truth": 0}, {"key": "36472242", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08064661530033333, "ground_truth": 0}, {"key": "36472242", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08601587858818273, "ground_truth": 0}, {"key": "36472242", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1097057716560268, "ground_truth": 0}, {"key": "36472242", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07531230960716885, "ground_truth": 0}, {"key": "31854721", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04304284999445502, "ground_truth": 0}, {"key": "31854721", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06853749490021745, "ground_truth": 0}, {"key": "31854721", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09534946007372737, "ground_truth": 0}, {"key": "31854721", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08389038633191234, "ground_truth": 0}, {"key": "31854721", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.053601141856543966, "ground_truth": 0}, {"key": "18725849", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10743747337122551, "ground_truth": 0}, {"key": "18725849", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10557884238158458, "ground_truth": 0}, {"key": "18725849", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14128142300293797, "ground_truth": 0}, {"key": "18725849", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08151975241829244, "ground_truth": 0}, {"key": "18725849", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08509904462433218, "ground_truth": 0}, {"key": "36883179", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04304284694473534, "ground_truth": 0}, {"key": "36883179", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06656918698080022, "ground_truth": 0}, {"key": "36883179", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0450155309746063, "ground_truth": 0}, {"key": "36883179", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05460060606136951, "ground_truth": 0}, {"key": "36883179", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024798161944105505, "ground_truth": 0}, {"key": "34266359", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2351083828411479, "ground_truth": 0}, {"key": "34266359", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2751297290436757, "ground_truth": 0}, {"key": "34266359", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19498021190780487, "ground_truth": 0}, {"key": "34266359", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15921740775010068, "ground_truth": 0}, {"key": "34266359", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2220246788866356, "ground_truth": 0}, {"key": "31920289", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2743513513442343, "ground_truth": 0}, {"key": "31920289", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20946968941074603, "ground_truth": 0}, {"key": "31920289", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4205995968628243, "ground_truth": 0}, {"key": "31920289", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.47268348275314603, "ground_truth": 0}, {"key": "31920289", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3140505676039046, "ground_truth": 0}, {"key": "36292997", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.026355353504988552, "ground_truth": 0}, {"key": "36292997", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.017442485832532446, "ground_truth": 0}, {"key": "36292997", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03760863471644851, "ground_truth": 0}, {"key": "36292997", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.038321972973713175, "ground_truth": 0}, {"key": "36292997", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01798621062973112, "ground_truth": 0}, {"key": "30412533", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04586266234778057, "ground_truth": 0}, {"key": "30412533", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1384617997589785, "ground_truth": 0}, {"key": "30412533", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09947020683091633, "ground_truth": 0}, {"key": "30412533", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.028544151037008733, "ground_truth": 0}, {"key": "30412533", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06325052108675375, "ground_truth": 0}, {"key": "40433191", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17724050651609488, "ground_truth": 0}, {"key": "40433191", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15843459583062644, "ground_truth": 0}, {"key": "40433191", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1937568723434537, "ground_truth": 0}, {"key": "40433191", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256487209278, "ground_truth": 0}, {"key": "40433191", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14706452590068028, "ground_truth": 0}, {"key": "34565591", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02822098683748067, "ground_truth": 0}, {"key": "34565591", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08945459678534011, "ground_truth": 0}, {"key": "34565591", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.039638839671776636, "ground_truth": 0}, {"key": "34565591", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0736962726933824, "ground_truth": 0}, {"key": "34565591", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07751765348708073, "ground_truth": 0}, {"key": "36062480", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04352814070679038, "ground_truth": 0}, {"key": "36062480", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06301947594963159, "ground_truth": 0}, {"key": "36062480", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04603390203878443, "ground_truth": 0}, {"key": "36062480", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09401018015185247, "ground_truth": 0}, {"key": "36062480", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05184547038258385, "ground_truth": 0}, {"key": "37276883", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3477585711267701, "ground_truth": 0}, {"key": "37276883", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20181321843581798, "ground_truth": 0}, {"key": "37276883", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4339814856945152, "ground_truth": 0}, {"key": "37276883", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.46684560129431457, "ground_truth": 0}, {"key": "37276883", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2958398627055965, "ground_truth": 0}, {"key": "38509260", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.049222115238356436, "ground_truth": 0}, {"key": "38509260", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.015603534174547538, "ground_truth": 0}, {"key": "38509260", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03358950582123063, "ground_truth": 0}, {"key": "38509260", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.030675798905084112, "ground_truth": 0}, {"key": "38509260", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04867656985361769, "ground_truth": 0}, {"key": "37139607", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3311197350127636, "ground_truth": 0}, {"key": "37139607", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.30074560589700555, "ground_truth": 0}, {"key": "37139607", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2133771669027101, "ground_truth": 0}, {"key": "37139607", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3354596714471903, "ground_truth": 0}, {"key": "37139607", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23581159595873405, "ground_truth": 0}, {"key": "37092824", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2206781613754584, "ground_truth": 0}, {"key": "37092824", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3398276154678225, "ground_truth": 0}, {"key": "37092824", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.29259530570717085, "ground_truth": 0}, {"key": "37092824", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552952416590663, "ground_truth": 0}, {"key": "37092824", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23440664574599918, "ground_truth": 0}, {"key": "32191802", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10743747884098613, "ground_truth": 0}, {"key": "32191802", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6495786089449098, "ground_truth": 0}, {"key": "32191802", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5813030633850347, "ground_truth": 0}, {"key": "32191802", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168781707264267, "ground_truth": 0}, {"key": "32191802", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17328820124917088, "ground_truth": 0}, {"key": "39396038", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04208772984475649, "ground_truth": 0}, {"key": "39396038", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11797801871930841, "ground_truth": 0}, {"key": "39396038", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07531230374174709, "ground_truth": 0}, {"key": "39396038", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09105828151714557, "ground_truth": 0}, {"key": "39396038", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0703038461249123, "ground_truth": 0}, {"key": "39076884", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07081620063953496, "ground_truth": 0}, {"key": "39076884", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.042087729142418144, "ground_truth": 0}, {"key": "39076884", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06441766695482844, "ground_truth": 0}, {"key": "39076884", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04146227642123158, "ground_truth": 0}, {"key": "39076884", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03690806681566035, "ground_truth": 0}, {"key": "27763432", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.018689307650258644, "ground_truth": 0}, {"key": "27763432", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.012970386753313587, "ground_truth": 0}, {"key": "27763432", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.011552671816224344, "ground_truth": 0}, {"key": "27763432", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.008511302989062967, "ground_truth": 0}, {"key": "27763432", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.00997492192175487, "ground_truth": 0}, {"key": "37806929", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.37022539416549294, "ground_truth": 0}, {"key": "37806929", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.47852884336011237, "ground_truth": 0}, {"key": "37806929", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6477982177880832, "ground_truth": 0}, {"key": "37806929", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4649015679102083, "ground_truth": 0}, {"key": "37806929", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.35936413834008407, "ground_truth": 0}, {"key": "32334186", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08269734035677406, "ground_truth": 0}, {"key": "32334186", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0826973417394831, "ground_truth": 0}, {"key": "32334186", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.029760093764950146, "ground_truth": 0}, {"key": "32334186", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03978781018728711, "ground_truth": 0}, {"key": "32334186", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02800751972414295, "ground_truth": 0}, {"key": "36187324", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1334152123134649, "ground_truth": 0}, {"key": "36187324", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08570927117308755, "ground_truth": 0}, {"key": "36187324", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05686155271390568, "ground_truth": 0}, {"key": "36187324", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08725224514855746, "ground_truth": 0}, {"key": "36187324", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04977344839203548, "ground_truth": 0}, {"key": "35306009", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0402379433355064, "ground_truth": 0}, {"key": "35306009", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.052037823766476456, "ground_truth": 0}, {"key": "35306009", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05340333495000893, "ground_truth": 0}, {"key": "35306009", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07263670446068544, "ground_truth": 0}, {"key": "35306009", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.062331038807790444, "ground_truth": 0}, {"key": "39490050", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01826427850384249, "ground_truth": 0}, {"key": "39490050", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12252321241230837, "ground_truth": 0}, {"key": "39490050", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0492221152359616, "ground_truth": 0}, {"key": "39490050", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02237145833476957, "ground_truth": 0}, {"key": "39490050", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06097518090337903, "ground_truth": 0}, {"key": "38072149", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.006241259966482823, "ground_truth": 0}, {"key": "38072149", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01771229911078415, "ground_truth": 0}, {"key": "38072149", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.007968814505106142, "ground_truth": 0}, {"key": "38072149", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03210070931163295, "ground_truth": 0}, {"key": "38072149", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04146227450545647, "ground_truth": 0}, {"key": "35899689", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24077459483475944, "ground_truth": 0}, {"key": "35899689", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19868535292948922, "ground_truth": 0}, {"key": "35899689", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10594828151980007, "ground_truth": 0}, {"key": "35899689", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20055769287514727, "ground_truth": 0}, {"key": "35899689", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15765489435400434, "ground_truth": 0}, {"key": "27994518", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7295197735716313, "ground_truth": 0}, {"key": "27994518", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1403362491075491, "ground_truth": 0}, {"key": "27994518", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5774953779960539, "ground_truth": 0}, {"key": "27994518", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19193278777884878, "ground_truth": 0}, {"key": "27994518", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195270984332, "ground_truth": 0}, {"key": "10615479", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11397345731434806, "ground_truth": 0}, {"key": "10615479", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.015483987919196602, "ground_truth": 0}, {"key": "10615479", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09877259451858673, "ground_truth": 0}, {"key": "10615479", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10594828106014455, "ground_truth": 0}, {"key": "10615479", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07640767993616521, "ground_truth": 0}, {"key": "40186667", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.031026179456005477, "ground_truth": 0}, {"key": "40186667", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.012673735651574935, "ground_truth": 0}, {"key": "40186667", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.027585282951484488, "ground_truth": 0}, {"key": "40186667", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05223085717847106, "ground_truth": 0}, {"key": "40186667", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012970387574307537, "ground_truth": 0}, {"key": "38622886", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05541279134647376, "ground_truth": 0}, {"key": "38622886", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0037217086918710563, "ground_truth": 0}, {"key": "38622886", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04130730508016858, "ground_truth": 0}, {"key": "38622886", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05500528694579994, "ground_truth": 0}, {"key": "38622886", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.023065225025508073, "ground_truth": 0}, {"key": "40686943", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13028542587765418, "ground_truth": 0}, {"key": "40686943", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14033625753455076, "ground_truth": 0}, {"key": "40686943", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19806417593241246, "ground_truth": 0}, {"key": "40686943", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1847675115401635, "ground_truth": 0}, {"key": "40686943", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09203286323205538, "ground_truth": 0}, {"key": "30604567", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.470736589620356, "ground_truth": 0}, {"key": "30604567", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.47073659874063933, "ground_truth": 0}, {"key": "30604567", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "30604567", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910862836406, "ground_truth": 0}, {"key": "30604567", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381510758239, "ground_truth": 0}, {"key": "35440903", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09534946144603539, "ground_truth": 0}, {"key": "35440903", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05070536341207083, "ground_truth": 0}, {"key": "35440903", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12765261643670392, "ground_truth": 0}, {"key": "35440903", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1320661547546601, "ground_truth": 0}, {"key": "35440903", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06903792874605928, "ground_truth": 0}, {"key": "37219533", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027169232193585666, "ground_truth": 0}, {"key": "37219533", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04958902280649708, "ground_truth": 0}, {"key": "37219533", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04586266402729997, "ground_truth": 0}, {"key": "37219533", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.044680869675601406, "ground_truth": 0}, {"key": "37219533", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1592174010877929, "ground_truth": 0}, {"key": "40178965", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.028761588201447502, "ground_truth": 0}, {"key": "40178965", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.027795625178302807, "ground_truth": 0}, {"key": "40178965", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04903962276232983, "ground_truth": 0}, {"key": "40178965", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.008577485562649357, "ground_truth": 0}, {"key": "40178965", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012673736070907491, "ground_truth": 0}, {"key": "13750468", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14033624782542742, "ground_truth": 0}, {"key": "13750468", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.26971013116740944, "ground_truth": 0}, {"key": "13750468", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09947021338155322, "ground_truth": 0}, {"key": "13750468", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2991052104586716, "ground_truth": 0}, {"key": "13750468", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2925953242979812, "ground_truth": 0}, {"key": "17754949", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.28937170199902124, "ground_truth": 0}, {"key": "17754949", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.25832597462959045, "ground_truth": 0}, {"key": "17754949", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6495786220216934, "ground_truth": 0}, {"key": "17754949", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102717054133, "ground_truth": 0}, {"key": "17754949", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850304962052, "ground_truth": 0}, {"key": "36675623", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19868533868946536, "ground_truth": 0}, {"key": "36675623", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18010666592165345, "ground_truth": 0}, {"key": "36675623", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.036769465974227304, "ground_truth": 0}, {"key": "36675623", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07263671051441939, "ground_truth": 0}, {"key": "36675623", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12506537892869216, "ground_truth": 0}, {"key": "40035440", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13614831758947754, "ground_truth": 0}, {"key": "40035440", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.058560824713381296, "ground_truth": 0}, {"key": "40035440", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06681232843379763, "ground_truth": 0}, {"key": "40035440", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08419108456796966, "ground_truth": 0}, {"key": "40035440", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1204388114166811, "ground_truth": 0}, {"key": "37685909", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09534946512277587, "ground_truth": 0}, {"key": "37685909", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10594827469014124, "ground_truth": 0}, {"key": "37685909", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09739039695368393, "ground_truth": 0}, {"key": "37685909", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15203224392620715, "ground_truth": 0}, {"key": "37685909", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05261895716817042, "ground_truth": 0}, {"key": "36938787", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6566582902211325, "ground_truth": 0}, {"key": "36938787", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.627038155426454, "ground_truth": 0}, {"key": "36938787", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8080672231598123, "ground_truth": 0}, {"key": "36938787", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185944219388039, "ground_truth": 0}, {"key": "36938787", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307690395943, "ground_truth": 0}, {"key": "39398068", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.009020280327510012, "ground_truth": 0}, {"key": "39398068", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0072890776451245655, "ground_truth": 0}, {"key": "39398068", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.022032264699100246, "ground_truth": 0}, {"key": "39398068", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.010611421048634878, "ground_truth": 0}, {"key": "39398068", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.010529712085248567, "ground_truth": 0}, {"key": "39926408", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13386749009698706, "ground_truth": 0}, {"key": "39926408", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16132024628136699, "ground_truth": 0}, {"key": "39926408", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.24508500865322583, "ground_truth": 0}, {"key": "39926408", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21601152170057744, "ground_truth": 0}, {"key": "39926408", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1175721364950537, "ground_truth": 0}, {"key": "40465336", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.39420094232177516, "ground_truth": 0}, {"key": "40465336", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3328523469469852, "ground_truth": 0}, {"key": "40465336", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.34687309744569866, "ground_truth": 0}, {"key": "40465336", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381299469675, "ground_truth": 0}, {"key": "40465336", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013782101797, "ground_truth": 0}, {"key": "34173549", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6469064768564637, "ground_truth": 0}, {"key": "34173549", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.809275973291061, "ground_truth": 0}, {"key": "34173549", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6766198946527563, "ground_truth": 0}, {"key": "34173549", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942262413701, "ground_truth": 0}, {"key": "34173549", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8591918309050677, "ground_truth": 0}, {"key": "33541535", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04434857895532575, "ground_truth": 0}, {"key": "33541535", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03371653817871144, "ground_truth": 0}, {"key": "33541535", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11240507339710791, "ground_truth": 0}, {"key": "33541535", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06730108048745079, "ground_truth": 0}, {"key": "33541535", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14318771575279512, "ground_truth": 0}, {"key": "35685195", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02909075668105462, "ground_truth": 0}, {"key": "35685195", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.055617614443445804, "ground_truth": 0}, {"key": "35685195", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.026963500334928746, "ground_truth": 0}, {"key": "35685195", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03904829078863694, "ground_truth": 0}, {"key": "35685195", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03410042779318055, "ground_truth": 0}, {"key": "28440730", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09268777253442975, "ground_truth": 0}, {"key": "28440730", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15610490612559372, "ground_truth": 0}, {"key": "28440730", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.33633105110934997, "ground_truth": 0}, {"key": "28440730", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19930800855956962, "ground_truth": 0}, {"key": "28440730", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24653334169906263, "ground_truth": 0}, {"key": "38338714", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.48242910285444535, "ground_truth": 0}, {"key": "38338714", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "38338714", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.47657965715307843, "ground_truth": 0}, {"key": "38338714", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621765075578459, "ground_truth": 0}, {"key": "38338714", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.331985496062602, "ground_truth": 0}, {"key": "32191881", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.21866939008396413, "ground_truth": 0}, {"key": "32191881", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12765262401912678, "ground_truth": 0}, {"key": "32191881", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1699562368473419, "ground_truth": 0}, {"key": "32191881", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05146276620685065, "ground_truth": 0}, {"key": "32191881", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11879340184345374, "ground_truth": 0}, {"key": "37707251", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01697999250369989, "ground_truth": 0}, {"key": "37707251", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0446808737649819, "ground_truth": 0}, {"key": "37707251", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20753575632910876, "ground_truth": 0}, {"key": "37707251", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08756384366059257, "ground_truth": 0}, {"key": "37707251", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0963650986978452, "ground_truth": 0}, {"key": "40172567", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0863234794838162, "ground_truth": 0}, {"key": "40172567", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17106118612404672, "ground_truth": 0}, {"key": "40172567", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07504072502991982, "ground_truth": 0}, {"key": "40172567", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16995623156245918, "ground_truth": 0}, {"key": "40172567", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757212683010775, "ground_truth": 0}, {"key": "33113255", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06903792921401636, "ground_truth": 0}, {"key": "33113255", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1571368511364838, "ground_truth": 0}, {"key": "33113255", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23651623011077275, "ground_truth": 0}, {"key": "33113255", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07107366849068782, "ground_truth": 0}, {"key": "33113255", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10302442344418167, "ground_truth": 0}, {"key": "33022143", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0453525785526551, "ground_truth": 0}, {"key": "33022143", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.021864557575161557, "ground_truth": 0}, {"key": "33022143", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.036220058530333346, "ground_truth": 0}, {"key": "33022143", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1104711548691237, "ground_truth": 0}, {"key": "33022143", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.045352577860898226, "ground_truth": 0}, {"key": "32084473", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1135795867715463, "ground_truth": 0}, {"key": "32084473", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08329192476769377, "ground_truth": 0}, {"key": "32084473", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0881900435443779, "ground_truth": 0}, {"key": "32084473", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05070536275244029, "ground_truth": 0}, {"key": "32084473", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03817827812838828, "ground_truth": 0}, {"key": "40564245", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04569203378651625, "ground_truth": 0}, {"key": "40564245", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2509127939510747, "ground_truth": 0}, {"key": "40564245", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12043881435973584, "ground_truth": 0}, {"key": "40564245", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10447732404147715, "ground_truth": 0}, {"key": "40564245", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.42250462460529664, "ground_truth": 0}, {"key": "31717213", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16132024165122041, "ground_truth": 0}, {"key": "31717213", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08819004373327935, "ground_truth": 0}, {"key": "31717213", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12808823765912447, "ground_truth": 0}, {"key": "31717213", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08299415264972175, "ground_truth": 0}, {"key": "31717213", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1931473753404049, "ground_truth": 0}, {"key": "34861894", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05460060613426934, "ground_truth": 0}, {"key": "34861894", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.016593176306593696, "ground_truth": 0}, {"key": "34861894", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.049405246057670854, "ground_truth": 0}, {"key": "34861894", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.021698100149171305, "ground_truth": 0}, {"key": "34861894", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03488088734322323, "ground_truth": 0}, {"key": "40838760", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.041152887771149935, "ground_truth": 0}, {"key": "40838760", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.010013570832585065, "ground_truth": 0}, {"key": "40838760", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.020804490393304897, "ground_truth": 0}, {"key": "40838760", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.017176709847646906, "ground_truth": 0}, {"key": "40838760", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03760863698296259, "ground_truth": 0}, {"key": "40044849", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.32939170588647326, "ground_truth": 0}, {"key": "40044849", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08694165923194548, "ground_truth": 0}, {"key": "40044849", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4941408889610142, "ground_truth": 0}, {"key": "40044849", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11516222956891196, "ground_truth": 0}, {"key": "40044849", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740213196065, "ground_truth": 0}, {"key": "30296116", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09138210827574758, "ground_truth": 0}, {"key": "30296116", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1666753992380003, "ground_truth": 0}, {"key": "30296116", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1320661504298374, "ground_truth": 0}, {"key": "30296116", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1613202451881822, "ground_truth": 0}, {"key": "30296116", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12678517239525752, "ground_truth": 0}, {"key": "34931360", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10743746876326153, "ground_truth": 0}, {"key": "34931360", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11279539890722998, "ground_truth": 0}, {"key": "34931360", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.031143831544979295, "ground_truth": 0}, {"key": "34931360", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08210662817089455, "ground_truth": 0}, {"key": "34931360", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0900929965085166, "ground_truth": 0}, {"key": "18862422", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014785407613436188, "ground_truth": 0}, {"key": "18862422", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.019568675730436795, "ground_truth": 0}, {"key": "18862422", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01652955643241406, "ground_truth": 0}, {"key": "18862422", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.013636836044810972, "ground_truth": 0}, {"key": "18862422", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.018334452840383306, "ground_truth": 0}, {"key": "36361140", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3522017677942447, "ground_truth": 0}, {"key": "36361140", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3380771500794464, "ground_truth": 0}, {"key": "36361140", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3433417460212577, "ground_truth": 0}, {"key": "36361140", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22135068590641818, "ground_truth": 0}, {"key": "36361140", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.33633105609137404, "ground_truth": 0}, {"key": "39703329", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06954174397691175, "ground_truth": 0}, {"key": "39703329", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4941408708546798, "ground_truth": 0}, {"key": "39703329", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0933468723473311, "ground_truth": 0}, {"key": "39703329", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12765261956894872, "ground_truth": 0}, {"key": "39703329", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15304215086360462, "ground_truth": 0}, {"key": "34033324", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20946969143004363, "ground_truth": 0}, {"key": "34033324", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07807816090909844, "ground_truth": 0}, {"key": "34033324", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09602548821282485, "ground_truth": 0}, {"key": "34033324", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798743202992735, "ground_truth": 0}, {"key": "34033324", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14608725093249778, "ground_truth": 0}, {"key": "35658862", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06804042274899139, "ground_truth": 0}, {"key": "35658862", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11516223622496259, "ground_truth": 0}, {"key": "35658862", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10302442372588844, "ground_truth": 0}, {"key": "35658862", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07263670487156305, "ground_truth": 0}, {"key": "35658862", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07696083777840704, "ground_truth": 0}, {"key": "36092657", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0786423820041562, "ground_truth": 0}, {"key": "36092657", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09534946472936452, "ground_truth": 0}, {"key": "36092657", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09334687420164138, "ground_truth": 0}, {"key": "36092657", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.030908960401414557, "ground_truth": 0}, {"key": "36092657", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06008664728709595, "ground_truth": 0}, {"key": "26333438", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20307462571985999, "ground_truth": 0}, {"key": "26333438", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15304215486048778, "ground_truth": 0}, {"key": "26333438", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16344543737290818, "ground_truth": 0}, {"key": "26333438", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10447731685089107, "ground_truth": 0}, {"key": "26333438", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15304216041316093, "ground_truth": 0}, {"key": "34184963", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09334687446771137, "ground_truth": 0}, {"key": "34184963", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08882028898811391, "ground_truth": 0}, {"key": "34184963", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.026255299408703494, "ground_truth": 0}, {"key": "34184963", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01994693437904481, "ground_truth": 0}, {"key": "34184963", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06954173984598312, "ground_truth": 0}, {"key": "35069975", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03649376607468777, "ground_truth": 0}, {"key": "35069975", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.024892802990529195, "ground_truth": 0}, {"key": "35069975", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03488088825248139, "ground_truth": 0}, {"key": "35069975", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02953533795769148, "ground_truth": 0}, {"key": "35069975", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.006463137850694331, "ground_truth": 0}, {"key": "36443950", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04468087261224697, "ground_truth": 0}, {"key": "36443950", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1361483195780744, "ground_truth": 0}, {"key": "36443950", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07640768139126043, "ground_truth": 0}, {"key": "36443950", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08389039253445811, "ground_truth": 0}, {"key": "36443950", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12168575785187664, "ground_truth": 0}, {"key": "29460858", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03993731856827445, "ground_truth": 0}, {"key": "29460858", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04672495723207891, "ground_truth": 0}, {"key": "29460858", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0872522476206174, "ground_truth": 0}, {"key": "29460858", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.022542964972793084, "ground_truth": 0}, {"key": "29460858", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.021698099334736366, "ground_truth": 0}, {"key": "36155704", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05707139846121916, "ground_truth": 0}, {"key": "36155704", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.013222822082740636, "ground_truth": 0}, {"key": "36155704", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02976009224383655, "ground_truth": 0}, {"key": "36155704", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.020964239955161657, "ground_truth": 0}, {"key": "36155704", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01861780166205316, "ground_truth": 0}, {"key": "37185211", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01584536054287595, "ground_truth": 0}, {"key": "37185211", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.012970388352300926, "ground_truth": 0}, {"key": "37185211", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010652511761551397, "ground_truth": 0}, {"key": "37185211", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03732688510564415, "ground_truth": 0}, {"key": "37185211", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.008315779073673549, "ground_truth": 0}, {"key": "36454885", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.025760558895696915, "ground_truth": 0}, {"key": "36454885", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.017848737887418076, "ground_truth": 0}, {"key": "36454885", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03488088975787638, "ground_truth": 0}, {"key": "36454885", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04468087321146928, "ground_truth": 0}, {"key": "36454885", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.040087356850670844, "ground_truth": 0}, {"key": "33148906", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02262919918539718, "ground_truth": 0}, {"key": "33148906", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.020804490758130543, "ground_truth": 0}, {"key": "33148906", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02145073022803095, "ground_truth": 0}, {"key": "33148906", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02228618521890095, "ground_truth": 0}, {"key": "33148906", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05460060616364299, "ground_truth": 0}, {"key": "18086604", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10302442676065962, "ground_truth": 0}, {"key": "18086604", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07369627097491462, "ground_truth": 0}, {"key": "18086604", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03594832193892973, "ground_truth": 0}, {"key": "18086604", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08006926567122558, "ground_truth": 0}, {"key": "18086604", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04922211727917462, "ground_truth": 0}, {"key": "33693397", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2186693782494579, "ground_truth": 0}, {"key": "33693397", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05281402506001575, "ground_truth": 0}, {"key": "33693397", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07185126832117888, "ground_truth": 0}, {"key": "33693397", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05791808928883348, "ground_truth": 0}, {"key": "33693397", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06632687022155177, "ground_truth": 0}, {"key": "39501530", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01450357974951009, "ground_truth": 0}, {"key": "39501530", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.024237633656702846, "ground_truth": 0}, {"key": "39501530", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.009376237424431662, "ground_truth": 0}, {"key": "39501530", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02800752206696619, "ground_truth": 0}, {"key": "39501530", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04336579927868536, "ground_truth": 0}, {"key": "30948874", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17553806568506639, "ground_truth": 0}, {"key": "30948874", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5175708800518326, "ground_truth": 0}, {"key": "30948874", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.26208568774896235, "ground_truth": 0}, {"key": "30948874", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21733751505453489, "ground_truth": 0}, {"key": "30948874", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21206881211167208, "ground_truth": 0}, {"key": "39410675", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03185885710430026, "ground_truth": 0}, {"key": "39410675", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.041152885084241954, "ground_truth": 0}, {"key": "39410675", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.059646938698045236, "ground_truth": 0}, {"key": "39410675", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.056652422420304646, "ground_truth": 0}, {"key": "39410675", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07585817979175291, "ground_truth": 0}, {"key": "32903337", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06560483220216444, "ground_truth": 0}, {"key": "32903337", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03663136479871268, "ground_truth": 0}, {"key": "32903337", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07640768215994437, "ground_truth": 0}, {"key": "32903337", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.037326886412482, "ground_truth": 0}, {"key": "32903337", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04922211656848704, "ground_truth": 0}, {"key": "27685132", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08694166042247206, "ground_truth": 0}, {"key": "27685132", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07004896168439313, "ground_truth": 0}, {"key": "27685132", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01798620917205737, "ground_truth": 0}, {"key": "27685132", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04569203049792551, "ground_truth": 0}, {"key": "27685132", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.044018656716132594, "ground_truth": 0}, {"key": "22791471", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07585818536932934, "ground_truth": 0}, {"key": "22791471", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09401018351359215, "ground_truth": 0}, {"key": "22791471", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1530421484098879, "ground_truth": 0}, {"key": "22791471", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07864238252180107, "ground_truth": 0}, {"key": "22791471", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0809367106903201, "ground_truth": 0}, {"key": "32292348", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.023689471322806573, "ground_truth": 0}, {"key": "32292348", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04385456362465882, "ground_truth": 0}, {"key": "32292348", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03934250378187242, "ground_truth": 0}, {"key": "32292348", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05033063071339744, "ground_truth": 0}, {"key": "32292348", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02479816185692373, "ground_truth": 0}, {"key": "20482930", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03775027608935582, "ground_truth": 0}, {"key": "20482930", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05856082672272356, "ground_truth": 0}, {"key": "20482930", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05480259333185665, "ground_truth": 0}, {"key": "20482930", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.053403335309986665, "ground_truth": 0}, {"key": "20482930", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07263670427386411, "ground_truth": 0}, {"key": "11635754", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027169233023811794, "ground_truth": 0}, {"key": "11635754", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07423136966501366, "ground_truth": 0}, {"key": "11635754", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09367800170709707, "ground_truth": 0}, {"key": "11635754", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05500528638461829, "ground_truth": 0}, {"key": "11635754", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08632347595813143, "ground_truth": 0}, {"key": "40029096", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10447731935894727, "ground_truth": 0}, {"key": "40029096", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05520868796690532, "ground_truth": 0}, {"key": "40029096", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11357958602103183, "ground_truth": 0}, {"key": "40029096", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04518375434528065, "ground_truth": 0}, {"key": "40029096", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07640767876331947, "ground_truth": 0}, {"key": "40414719", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.372048792730384, "ground_truth": 0}, {"key": "40414719", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.42632160134864816, "ground_truth": 0}, {"key": "40414719", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.40356687932219687, "ground_truth": 0}, {"key": "40414719", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030917417947, "ground_truth": 0}, {"key": "40414719", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199147280387, "ground_truth": 0}, {"key": "39537616", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027066174371266415, "ground_truth": 0}, {"key": "39537616", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.006192990493222061, "ground_truth": 0}, {"key": "39537616", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05707139784768393, "ground_truth": 0}, {"key": "39537616", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03775027544242967, "ground_truth": 0}, {"key": "39537616", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.019870714178893554, "ground_truth": 0}, {"key": "33245830", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.47463117758003415, "ground_truth": 0}, {"key": "33245830", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15203224861535922, "ground_truth": 0}, {"key": "33245830", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19930800859712236, "ground_truth": 0}, {"key": "33245830", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.32423539100781956, "ground_truth": 0}, {"key": "33245830", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804322895911, "ground_truth": 0}, {"key": "39243601", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5736784192436942, "ground_truth": 0}, {"key": "39243601", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.27982849974767093, "ground_truth": 0}, {"key": "39243601", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4167966519586819, "ground_truth": 0}, {"key": "39243601", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.484380110798134, "ground_truth": 0}, {"key": "39243601", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014734742334493, "ground_truth": 0}, {"key": "35815905", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03663136503378995, "ground_truth": 0}, {"key": "35815905", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06954174110641748, "ground_truth": 0}, {"key": "35815905", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.037047170487902396, "ground_truth": 0}, {"key": "35815905", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02297737016013555, "ground_truth": 0}, {"key": "35815905", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08449275299411407, "ground_truth": 0}, {"key": "35260212", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1431877039796076, "ground_truth": 0}, {"key": "35260212", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09947020646586564, "ground_truth": 0}, {"key": "35260212", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06954174144424029, "ground_truth": 0}, {"key": "35260212", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.042087727373780574, "ground_truth": 0}, {"key": "35260212", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.044018655420036086, "ground_truth": 0}, {"key": "39193924", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11920291902146084, "ground_truth": 0}, {"key": "39193924", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22270014275708433, "ground_truth": 0}, {"key": "39193924", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13028541540260236, "ground_truth": 0}, {"key": "39193924", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11838509545574225, "ground_truth": 0}, {"key": "39193924", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23934934503819366, "ground_truth": 0}, {"key": "40658569", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03474962660104715, "ground_truth": 0}, {"key": "40658569", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07779744711434856, "ground_truth": 0}, {"key": "40658569", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.032466816769360855, "ground_truth": 0}, {"key": "40658569", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07107366625590598, "ground_truth": 0}, {"key": "40658569", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05360114427029925, "ground_truth": 0}, {"key": "33497596", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23651623729920485, "ground_truth": 0}, {"key": "33497596", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07723879182124622, "ground_truth": 0}, {"key": "33497596", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17106118436540538, "ground_truth": 0}, {"key": "33497596", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08359066753138943, "ground_truth": 0}, {"key": "33497596", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14706452893416028, "ground_truth": 0}, {"key": "40339241", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.029312230654497645, "ground_truth": 0}, {"key": "40339241", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.039342505472969705, "ground_truth": 0}, {"key": "40339241", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08787643875838472, "ground_truth": 0}, {"key": "40339241", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.020023440307453906, "ground_truth": 0}, {"key": "40339241", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.049773445793005376, "ground_truth": 0}, {"key": "31792608", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15507846917667478, "ground_truth": 0}, {"key": "31792608", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08329192753636466, "ground_truth": 0}, {"key": "31792608", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1744102789000519, "ground_truth": 0}, {"key": "31792608", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13568954533008434, "ground_truth": 0}, {"key": "31792608", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16885694918181046, "ground_truth": 0}, {"key": "33132662", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10521053129444567, "ground_truth": 0}, {"key": "33132662", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17106117891322795, "ground_truth": 0}, {"key": "33132662", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13939638023120046, "ground_truth": 0}, {"key": "33132662", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07504072306438538, "ground_truth": 0}, {"key": "33132662", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.060529390734633495, "ground_truth": 0}, {"key": "37577457", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08663206736523177, "ground_truth": 0}, {"key": "37577457", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.039787809410608097, "ground_truth": 0}, {"key": "37577457", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.012147169701772079, "ground_truth": 0}, {"key": "37577457", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09739040223518564, "ground_truth": 0}, {"key": "37577457", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.028761588567417458, "ground_truth": 0}, {"key": "38701278", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2011847289415492, "ground_truth": 0}, {"key": "38701278", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3073580158985606, "ground_truth": 0}, {"key": "38701278", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16451645859672992, "ground_truth": 0}, {"key": "38701278", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.128963303125127, "ground_truth": 0}, {"key": "38701278", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14080817423212194, "ground_truth": 0}, {"key": "34570783", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16184942185941956, "ground_truth": 0}, {"key": "34570783", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.046205751591784236, "ground_truth": 0}, {"key": "34570783", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.059646944999932054, "ground_truth": 0}, {"key": "34570783", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.031026178919988025, "ground_truth": 0}, {"key": "34570783", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0663268718505903, "ground_truth": 0}, {"key": "39064526", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06608537998782077, "ground_truth": 0}, {"key": "39064526", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.018546563964693768, "ground_truth": 0}, {"key": "39064526", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09009299552383256, "ground_truth": 0}, {"key": "39064526", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04885777966774491, "ground_truth": 0}, {"key": "39064526", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09602548923996258, "ground_truth": 0}, {"key": "40741545", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5660185331370642, "ground_truth": 0}, {"key": "40741545", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3311197169145104, "ground_truth": 0}, {"key": "40741545", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4186969327051687, "ground_truth": 0}, {"key": "40741545", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4493926276844389, "ground_truth": 0}, {"key": "40741545", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.26133092474450503, "ground_truth": 0}, {"key": "36929751", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2893717041114747, "ground_truth": 0}, {"key": "36929751", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3611647317330268, "ground_truth": 0}, {"key": "36929751", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3165805048490366, "ground_truth": 0}, {"key": "36929751", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.265118709958298, "ground_truth": 0}, {"key": "36929751", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897339012573, "ground_truth": 0}, {"key": "23984730", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.007636216255125638, "ground_truth": 0}, {"key": "23984730", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01052971177013292, "ground_truth": 0}, {"key": "23984730", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.012624948904213687, "ground_truth": 0}, {"key": "23984730", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.016340128361169808, "ground_truth": 0}, {"key": "23984730", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02315341137509945, "ground_truth": 0}, {"key": "36007415", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16451645498354633, "ground_truth": 0}, {"key": "36007415", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4571367010746828, "ground_truth": 0}, {"key": "36007415", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3812195777840851, "ground_truth": 0}, {"key": "36007415", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.33372032038093563, "ground_truth": 0}, {"key": "36007415", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.558326989724462, "ground_truth": 0}, {"key": "38875041", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03461883843486238, "ground_truth": 0}, {"key": "38875041", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.016152834764565176, "ground_truth": 0}, {"key": "38875041", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09401018400864336, "ground_truth": 0}, {"key": "38875041", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10017222193266595, "ground_truth": 0}, {"key": "38875041", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09877259237196481, "ground_truth": 0}]