[{"key": "35232142", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.26435834108343415, "ground_truth": 0}, {"key": "35232142", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.14223190037424951, "ground_truth": 0}, {"key": "35232142", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2925953213129459, "ground_truth": 0}, {"key": "35232142", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3738758416306157, "ground_truth": 0}, {"key": "35232142", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3647775667726071, "ground_truth": 0}, {"key": "40143035", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7704647844238259, "ground_truth": 0}, {"key": "40143035", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6842640144411147, "ground_truth": 0}, {"key": "40143035", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7866228454073015, "ground_truth": 0}, {"key": "40143035", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267872812367, "ground_truth": 0}, {"key": "40143035", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526042887765, "ground_truth": 0}, {"key": "35951548", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3225259837086528, "ground_truth": 0}, {"key": "35951548", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2227001508770008, "ground_truth": 0}, {"key": "35951548", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.09877259125073969, "ground_truth": 0}, {"key": "35951548", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2643583784329991, "ground_truth": 0}, {"key": "35951548", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.16132022305345425, "ground_truth": 0}, {"key": "36266422", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5175708632203133, "ground_truth": 0}, {"key": "36266422", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7401743585558792, "ground_truth": 0}, {"key": "36266422", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5869964468471818, "ground_truth": 0}, {"key": "36266422", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082680980693, "ground_truth": 0}, {"key": "36266422", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.34687308340133777, "ground_truth": 0}, {"key": "38826984", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.668880251042464, "ground_truth": 0}, {"key": "38826984", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4513265017051809, "ground_truth": 0}, {"key": "38826984", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6150878707690973, "ground_truth": 0}, {"key": "38826984", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318583780314, "ground_truth": 0}, {"key": "38826984", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.651354868338138, "ground_truth": 0}, {"key": "34540833", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.44746029080232624, "ground_truth": 0}, {"key": "34540833", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7122321824840743, "ground_truth": 0}, {"key": "34540833", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6095241615816895, "ground_truth": 0}, {"key": "34540833", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689596669246, "ground_truth": 0}, {"key": "34540833", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014733444207115, "ground_truth": 0}, {"key": "20836172", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8606036178273309, "ground_truth": 0}, {"key": "20836172", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9073122176599552, "ground_truth": 0}, {"key": "20836172", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8895288442038668, "ground_truth": 0}, {"key": "20836172", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578396737147, "ground_truth": 0}, {"key": "20836172", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920169951072, "ground_truth": 0}, {"key": "35932467", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5331544087916466, "ground_truth": 0}, {"key": "35932467", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.36116472064283994, "ground_truth": 0}, {"key": "35932467", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.611381996599894, "ground_truth": 0}, {"key": "35932467", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4610167647560546, "ground_truth": 0}, {"key": "35932467", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165326891497, "ground_truth": 0}, {"key": "40758845", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7853085832552898, "ground_truth": 0}, {"key": "40758845", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7201715279633787, "ground_truth": 0}, {"key": "40758845", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7279754326711212, "ground_truth": 0}, {"key": "40758845", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358437645917, "ground_truth": 0}, {"key": "40758845", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936459367008, "ground_truth": 0}, {"key": "30358490", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7549149946769856, "ground_truth": 0}, {"key": "30358490", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5583269682993386, "ground_truth": 0}, {"key": "30358490", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8210441173399323, "ground_truth": 0}, {"key": "30358490", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278583161752, "ground_truth": 0}, {"key": "30358490", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802501144666, "ground_truth": 0}, {"key": "34615665", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8322366524653726, "ground_truth": 0}, {"key": "34615665", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8255897245278633, "ground_truth": 0}, {"key": "34615665", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8832359800073533, "ground_truth": 0}, {"key": "34615665", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9669140204882007, "ground_truth": 0}, {"key": "34615665", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9111797055947362, "ground_truth": 0}, {"key": "35890902", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6584175170488473, "ground_truth": 0}, {"key": "35890902", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6976089056833115, "ground_truth": 0}, {"key": "35890902", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4882833933620864, "ground_truth": 0}, {"key": "35890902", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.694302677313186, "ground_truth": 0}, {"key": "35890902", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201714979717923, "ground_truth": 0}, {"key": "37922330", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7918210610171965, "ground_truth": 0}, {"key": "37922330", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5117166079524209, "ground_truth": 0}, {"key": "37922330", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6076631546961135, "ground_truth": 0}, {"key": "37922330", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210616261152, "ground_truth": 0}, {"key": "37922330", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740190149856, "ground_truth": 0}, {"key": "30844962", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2173375187373702, "ground_truth": 0}, {"key": "30844962", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.46490159301725653, "ground_truth": 0}, {"key": "30844962", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5486734862475033, "ground_truth": 0}, {"key": "30844962", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.268941438053809, "ground_truth": 0}, {"key": "30844962", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1699562256500258, "ground_truth": 0}, {"key": "36217333", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4167966679648345, "ground_truth": 0}, {"key": "36217333", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41679665376101055, "ground_truth": 0}, {"key": "36217333", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4167966405471359, "ground_truth": 0}, {"key": "36217333", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687309555030577, "ground_truth": 0}, {"key": "36217333", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.466845586575207, "ground_truth": 0}, {"key": "30816523", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6992544137029307, "ground_truth": 0}, {"key": "30816523", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5660185239882832, "ground_truth": 0}, {"key": "30816523", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6477982303739674, "ground_truth": 0}, {"key": "30816523", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641426083232, "ground_truth": 0}, {"key": "30816523", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.48828340111657337, "ground_truth": 0}, {"key": "38900884", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8643104378952051, "ground_truth": 0}, {"key": "38900884", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7969253644321119, "ground_truth": 0}, {"key": "38900884", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.910545397979998, "ground_truth": 0}, {"key": "38900884", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.710628299095714, "ground_truth": 0}, {"key": "38900884", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884817579427, "ground_truth": 0}, {"key": "13890581", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7431680382448872, "ground_truth": 0}, {"key": "13890581", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6132365551974336, "ground_truth": 0}, {"key": "13890581", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7106282990067637, "ground_truth": 0}, {"key": "13890581", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125583926948, "ground_truth": 0}, {"key": "13890581", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303089379568, "ground_truth": 0}, {"key": "40194700", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7505527789919829, "ground_truth": 0}, {"key": "40194700", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8519527941755896, "ground_truth": 0}, {"key": "40194700", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8289388115493003, "ground_truth": 0}, {"key": "40194700", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9376689696731049, "ground_truth": 0}, {"key": "40194700", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105532499215, "ground_truth": 0}, {"key": "37903647", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.22405544491481755, "ground_truth": 0}, {"key": "37903647", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238975703966, "ground_truth": 0}, {"key": "37903647", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2568320105827168, "ground_truth": 0}, {"key": "37903647", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3259495179223142, "ground_truth": 0}, {"key": "37903647", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783700749466, "ground_truth": 0}, {"key": "13291223", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6279512248912376, "ground_truth": 0}, {"key": "13291223", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6057990578744472, "ground_truth": 0}, {"key": "13291223", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.592666609712631, "ground_truth": 0}, {"key": "13291223", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708869434469, "ground_truth": 0}, {"key": "13291223", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984771479198, "ground_truth": 0}, {"key": "36052570", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43206341887309613, "ground_truth": 0}, {"key": "36052570", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5621764729145645, "ground_truth": 0}, {"key": "36052570", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7401743512260045, "ground_truth": 0}, {"key": "36052570", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.49804688379172535, "ground_truth": 0}, {"key": "36052570", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358175157718, "ground_truth": 0}, {"key": "34944735", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.41300359778907975, "ground_truth": 0}, {"key": "34944735", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45132650047101774, "ground_truth": 0}, {"key": "34944735", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5428633007949056, "ground_truth": 0}, {"key": "34944735", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666226192534, "ground_truth": 0}, {"key": "34944735", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880117973718, "ground_truth": 0}, {"key": "32159602", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2974699373579225, "ground_truth": 0}, {"key": "32159602", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5679365936360555, "ground_truth": 0}, {"key": "32159602", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3208213051451991, "ground_truth": 0}, {"key": "32159602", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33807711718831657, "ground_truth": 0}, {"key": "32159602", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3380771248668806, "ground_truth": 0}, {"key": "34988915", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.44167301287328076, "ground_truth": 0}, {"key": "34988915", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5058591083459649, "ground_truth": 0}, {"key": "34988915", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3738758197330634, "ground_truth": 0}, {"key": "34988915", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.24508501345720635, "ground_truth": 0}, {"key": "34988915", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633944572908, "ground_truth": 0}, {"key": "37889203", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8278281556268737, "ground_truth": 0}, {"key": "37889203", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9173026517484636, "ground_truth": 0}, {"key": "37889203", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8140527908203683, "ground_truth": 0}, {"key": "37889203", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438951085081465, "ground_truth": 0}, {"key": "37889203", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.854884627865306, "ground_truth": 0}, {"key": "33609927", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3123700031659476, "ground_truth": 0}, {"key": "33609927", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3433417511625021, "ground_truth": 0}, {"key": "33609927", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4359015272036169, "ground_truth": 0}, {"key": "33609927", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4320633760097813, "ground_truth": 0}, {"key": "33609927", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.41869691648207047, "ground_truth": 0}, {"key": "33578778", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5794004245478731, "ground_truth": 0}, {"key": "33578778", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6261241891717205, "ground_truth": 0}, {"key": "33578778", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5331543760045777, "ground_truth": 0}, {"key": "33578778", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880441652159, "ground_truth": 0}, {"key": "33578778", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216352481991, "ground_truth": 0}, {"key": "36888270", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8438950988584262, "ground_truth": 0}, {"key": "36888270", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7325918632080219, "ground_truth": 0}, {"key": "36888270", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.754914982858919, "ground_truth": 0}, {"key": "36888270", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9167080714812076, "ground_truth": 0}, {"key": "36888270", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701042382761, "ground_truth": 0}, {"key": "36846007", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.954307969233762, "ground_truth": 0}, {"key": "36846007", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9801292885037448, "ground_truth": 0}, {"key": "36846007", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9686195702397316, "ground_truth": 0}, {"key": "36846007", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9412234451215961, "ground_truth": 0}, {"key": "36846007", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.951863228855887, "ground_truth": 0}, {"key": "31723471", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9207896765409712, "ground_truth": 0}, {"key": "31723471", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7956580847702962, "ground_truth": 0}, {"key": "31723471", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6352224201239806, "ground_truth": 0}, {"key": "31723471", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837602109025, "ground_truth": 0}, {"key": "31723471", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493193970386, "ground_truth": 0}, {"key": "15921828", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2436424168039928, "ground_truth": 0}, {"key": "15921828", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.361164732566485, "ground_truth": 0}, {"key": "15921828", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43014736840008594, "ground_truth": 0}, {"key": "15921828", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3276682929306688, "ground_truth": 0}, {"key": "15921828", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.39047584809158237, "ground_truth": 0}, {"key": "39109408", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.281405598454496, "ground_truth": 0}, {"key": "39109408", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1550784688046993, "ground_truth": 0}, {"key": "39109408", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.21866937940098047, "ground_truth": 0}, {"key": "39109408", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519861033149606, "ground_truth": 0}, {"key": "39109408", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944723188899348, "ground_truth": 0}, {"key": "20936833", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.14318769910772042, "ground_truth": 0}, {"key": "20936833", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.08269734316553297, "ground_truth": 0}, {"key": "20936833", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.16132024397164385, "ground_truth": 0}, {"key": "20936833", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.17667159106265823, "ground_truth": 0}, {"key": "20936833", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.07211220394742598, "ground_truth": 0}, {"key": "36832879", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5945512482892211, "ground_truth": 0}, {"key": "36832879", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6113819751785238, "ground_truth": 0}, {"key": "36832879", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5907792423508629, "ground_truth": 0}, {"key": "36832879", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468895672893, "ground_truth": 0}, {"key": "36832879", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4167966646563183, "ground_truth": 0}, {"key": "14958201", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8289388011385419, "ground_truth": 0}, {"key": "14958201", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8418256500450217, "ground_truth": 0}, {"key": "14958201", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6406358773395084, "ground_truth": 0}, {"key": "14958201", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673138597629, "ground_truth": 0}, {"key": "14958201", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148271084704, "ground_truth": 0}, {"key": "34352262", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.07107366854467947, "ground_truth": 0}, {"key": "34352262", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.18476750723774418, "ground_truth": 0}, {"key": "34352262", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.10087862307123065, "ground_truth": 0}, {"key": "34352262", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.13206615227085153, "ground_truth": 0}, {"key": "34352262", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.08509904167116664, "ground_truth": 0}, {"key": "39805395", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2861692612392806, "ground_truth": 0}, {"key": "39805395", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.11838508928327449, "ground_truth": 0}, {"key": "39805395", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42632161180039474, "ground_truth": 0}, {"key": "39805395", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3398275938814091, "ground_truth": 0}, {"key": "39805395", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939171511336135, "ground_truth": 0}, {"key": "34303109", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.30569731329398947, "ground_truth": 0}, {"key": "34303109", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.28616923107735703, "ground_truth": 0}, {"key": "34303109", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.47657964244953355, "ground_truth": 0}, {"key": "34303109", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.43590150052523896, "ground_truth": 0}, {"key": "34303109", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238596029945, "ground_truth": 0}, {"key": "39939090", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8278281469748556, "ground_truth": 0}, {"key": "39939090", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8044059126502489, "ground_truth": 0}, {"key": "39939090", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7676898625357162, "ground_truth": 0}, {"key": "39939090", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581552680939, "ground_truth": 0}, {"key": "39939090", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563433159933, "ground_truth": 0}, {"key": "29347771", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6224593270289205, "ground_truth": 0}, {"key": "29347771", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.679178708532776, "ground_truth": 0}, {"key": "29347771", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8479677564167707, "ground_truth": 0}, {"key": "29347771", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504653776795, "ground_truth": 0}, {"key": "29347771", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624673937613, "ground_truth": 0}, {"key": "36783415", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6876299906854292, "ground_truth": 0}, {"key": "36783415", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.472683491741357, "ground_truth": 0}, {"key": "36783415", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.64957862117838, "ground_truth": 0}, {"key": "36783415", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531269102797155, "ground_truth": 0}, {"key": "36783415", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3923368161209492, "ground_truth": 0}, {"key": "37935687", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6442250830209278, "ground_truth": 0}, {"key": "37935687", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8386797728729393, "ground_truth": 0}, {"key": "37935687", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7676898658809045, "ground_truth": 0}, {"key": "37935687", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489722081151078, "ground_truth": 0}, {"key": "37935687", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.770464790079577, "ground_truth": 0}, {"key": "40260829", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.877476782647749, "ground_truth": 0}, {"key": "40260829", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8643104537812113, "ground_truth": 0}, {"key": "40260829", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9005297792581012, "ground_truth": 0}, {"key": "40260829", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059623215306, "ground_truth": 0}, {"key": "40260829", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063682151906, "ground_truth": 0}, {"key": "36478199", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7325918216093861, "ground_truth": 0}, {"key": "36478199", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6893055924359965, "ground_truth": 0}, {"key": "36478199", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7592254143989711, "ground_truth": 0}, {"key": "36478199", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990634193122, "ground_truth": 0}, {"key": "36478199", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527617540697, "ground_truth": 0}, {"key": "34541803", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5195213045944819, "ground_truth": 0}, {"key": "34541803", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4301473386746086, "ground_truth": 0}, {"key": "34541803", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4649015982921517, "ground_truth": 0}, {"key": "34541803", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023558968821995, "ground_truth": 0}, {"key": "34541803", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511644267766, "ground_truth": 0}, {"key": "35360841", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8289387951581647, "ground_truth": 0}, {"key": "35360841", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7994423106949295, "ground_truth": 0}, {"key": "35360841", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7505527707293773, "ground_truth": 0}, {"key": "35360841", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918304412736, "ground_truth": 0}, {"key": "35360841", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789112037533, "ground_truth": 0}, {"key": "35550407", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.602061598180559, "ground_truth": 0}, {"key": "35550407", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6224593610315949, "ground_truth": 0}, {"key": "35550407", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.523420377547982, "ground_truth": 0}, {"key": "35550407", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704844557509, "ground_truth": 0}, {"key": "35550407", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269573002653, "ground_truth": 0}, {"key": "37561590", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5660185678702729, "ground_truth": 0}, {"key": "37561590", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.635222455480651, "ground_truth": 0}, {"key": "37561590", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8832359812799441, "ground_truth": 0}, {"key": "37561590", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185944069410418, "ground_truth": 0}, {"key": "37561590", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689388016933, "ground_truth": 0}, {"key": "39328843", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8856314814485203, "ground_truth": 0}, {"key": "39328843", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9213576268267257, "ground_truth": 0}, {"key": "39328843", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8918110395858173, "ground_truth": 0}, {"key": "39328843", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9597620554267885, "ground_truth": 0}, {"key": "39328843", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9167080776807162, "ground_truth": 0}, {"key": "35389665", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9324533095693075, "ground_truth": 0}, {"key": "35389665", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9658995684560316, "ground_truth": 0}, {"key": "35389665", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9566342027792738, "ground_truth": 0}, {"key": "35389665", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9724147196724433, "ground_truth": 0}, {"key": "35389665", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9529258253961858, "ground_truth": 0}, {"key": "33080187", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.38491215405728135, "ground_truth": 0}, {"key": "33080187", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.16238003520440583, "ground_truth": 0}, {"key": "33080187", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1801066700006251, "ground_truth": 0}, {"key": "33080187", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.11124121483063262, "ground_truth": 0}, {"key": "33080187", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757214237157308, "ground_truth": 0}, {"key": "38636995", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5774953621253229, "ground_truth": 0}, {"key": "38636995", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7248702883355961, "ground_truth": 0}, {"key": "38636995", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5544704584116673, "ground_truth": 0}, {"key": "38636995", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185348188772, "ground_truth": 0}, {"key": "38636995", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149924735831, "ground_truth": 0}, {"key": "18536236", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6859494619064476, "ground_truth": 0}, {"key": "18536236", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.566018520897266, "ground_truth": 0}, {"key": "18536236", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5544704512858363, "ground_truth": 0}, {"key": "18536236", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370308014459476, "ground_truth": 0}, {"key": "18536236", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011531838943, "ground_truth": 0}, {"key": "36289151", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.46879063798344894, "ground_truth": 0}, {"key": "36289151", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5869964268399249, "ground_truth": 0}, {"key": "36289151", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6943026807125399, "ground_truth": 0}, {"key": "36289151", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633650928675, "ground_truth": 0}, {"key": "36289151", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544048872284, "ground_truth": 0}, {"key": "23017045", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6477982085931423, "ground_truth": 0}, {"key": "23017045", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6495786333832767, "ground_truth": 0}, {"key": "23017045", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7704647786529484, "ground_truth": 0}, {"key": "23017045", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526315608057, "ground_truth": 0}, {"key": "23017045", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461390070200076, "ground_truth": 0}, {"key": "36418082", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.870597284771826, "ground_truth": 0}, {"key": "36418082", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5273165301078737, "ground_truth": 0}, {"key": "36418082", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7853085875123954, "ground_truth": 0}, {"key": "36418082", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228153565845, "ground_truth": 0}, {"key": "36418082", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878801343264, "ground_truth": 0}, {"key": "34396551", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6876300150577469, "ground_truth": 0}, {"key": "34396551", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5774953586395424, "ground_truth": 0}, {"key": "34396551", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7416740131230177, "ground_truth": 0}, {"key": "34396551", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.19682619959860306, "ground_truth": 0}, {"key": "34396551", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2068940513675779, "ground_truth": 0}, {"key": "39720944", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.914900958654551, "ground_truth": 0}, {"key": "39720944", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8902942288150851, "ground_truth": 0}, {"key": "39720944", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9294403941994537, "ground_truth": 0}, {"key": "39720944", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.913676525336682, "ground_truth": 0}, {"key": "39720944", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632873119765, "ground_truth": 0}, {"key": "35884842", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4668455860829825, "ground_truth": 0}, {"key": "35884842", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4282334038953805, "ground_truth": 0}, {"key": "35884842", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.457136690550998, "ground_truth": 0}, {"key": "35884842", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2628418479290373, "ground_truth": 0}, {"key": "35884842", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.46101677271450003, "ground_truth": 0}, {"key": "35403375", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.29421494247134466, "ground_truth": 0}, {"key": "35403375", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2094696780890369, "ground_truth": 0}, {"key": "35403375", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3073580149625967, "ground_truth": 0}, {"key": "35403375", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4687906335790735, "ground_truth": 0}, {"key": "35403375", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.38676344806499274, "ground_truth": 0}, {"key": "26341324", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8267117921614475, "ground_truth": 0}, {"key": "26341324", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.744656334594235, "ground_truth": 0}, {"key": "26341324", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8344068931579002, "ground_truth": 0}, {"key": "26341324", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757645776946504, "ground_truth": 0}, {"key": "26341324", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397137664955, "ground_truth": 0}, {"key": "19212345", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8311430532322196, "ground_truth": 0}, {"key": "19212345", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8187367831808967, "ground_truth": 0}, {"key": "19212345", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8661325172697798, "ground_truth": 0}, {"key": "19212345", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513749879395, "ground_truth": 0}, {"key": "19212345", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505390489578, "ground_truth": 0}, {"key": "30548367", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7371581624980201, "ground_truth": 0}, {"key": "30548367", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6757645888541428, "ground_truth": 0}, {"key": "30548367", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6926419720182538, "ground_truth": 0}, {"key": "30548367", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936595511782, "ground_truth": 0}, {"key": "30548367", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430569516046, "ground_truth": 0}, {"key": "37919402", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8479677602746859, "ground_truth": 0}, {"key": "37919402", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9073122239387872, "ground_truth": 0}, {"key": "37919402", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8940517287307636, "ground_truth": 0}, {"key": "37919402", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970702379986, "ground_truth": 0}, {"key": "37919402", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519527913990416, "ground_truth": 0}, {"key": "39995133", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.841825651446342, "ground_truth": 0}, {"key": "39995133", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9637799436971112, "ground_truth": 0}, {"key": "39995133", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9640516798723363, "ground_truth": 0}, {"key": "39995133", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9202179817742178, "ground_truth": 0}, {"key": "39995133", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.822189134320385, "ground_truth": 0}, {"key": "40249088", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6460136998296846, "ground_truth": 0}, {"key": "40249088", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8300437785076964, "ground_truth": 0}, {"key": "40249088", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.44167299573781893, "ground_truth": 0}, {"key": "40249088", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585845690235, "ground_truth": 0}, {"key": "40249088", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311988790612, "ground_truth": 0}, {"key": "40254388", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.38676342440065437, "ground_truth": 0}, {"key": "40254388", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5389832247575695, "ground_truth": 0}, {"key": "40254388", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5506073883114609, "ground_truth": 0}, {"key": "40254388", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105510089513, "ground_truth": 0}, {"key": "40254388", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666532705082, "ground_truth": 0}, {"key": "31995230", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8661325242480774, "ground_truth": 0}, {"key": "31995230", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7786493134812138, "ground_truth": 0}, {"key": "31995230", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9053222987216106, "ground_truth": 0}, {"key": "31995230", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338532856457, "ground_truth": 0}, {"key": "31995230", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9626731175399319, "ground_truth": 0}, {"key": "38632129", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9529258236293366, "ground_truth": 0}, {"key": "38632129", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9252299576431076, "ground_truth": 0}, {"key": "38632129", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9653811631015619, "ground_truth": 0}, {"key": "38632129", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9118099635955431, "ground_truth": 0}, {"key": "38632129", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647021911848, "ground_truth": 0}, {"key": "35720795", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6791787192836671, "ground_truth": 0}, {"key": "35720795", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8116760228249639, "ground_truth": 0}, {"key": "35720795", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6076631368745141, "ground_truth": 0}, {"key": "35720795", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9079671346515537, "ground_truth": 0}, {"key": "35720795", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723316948121626, "ground_truth": 0}, {"key": "23906759", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5755879828135574, "ground_truth": 0}, {"key": "23906759", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8418256680815598, "ground_truth": 0}, {"key": "23906759", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7799928920693303, "ground_truth": 0}, {"key": "23906759", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253716117951, "ground_truth": 0}, {"key": "23906759", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.732591829430633, "ground_truth": 0}, {"key": "19410108", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.618780433623383, "ground_truth": 0}, {"key": "19410108", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7718435021283667, "ground_truth": 0}, {"key": "19410108", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6706082738919087, "ground_truth": 0}, {"key": "19410108", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.646013691321394, "ground_truth": 0}, {"key": "19410108", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241902811721, "ground_truth": 0}, {"key": "30745137", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.48438009856114556, "ground_truth": 0}, {"key": "30745137", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.451326529958065, "ground_truth": 0}, {"key": "30745137", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5214711832633305, "ground_truth": 0}, {"key": "30745137", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526731731129, "ground_truth": 0}, {"key": "30745137", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.48828339589818714, "ground_truth": 0}, {"key": "26553115", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2689414198949145, "ground_truth": 0}, {"key": "26553115", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.36116474490187667, "ground_truth": 0}, {"key": "26553115", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.24944725837270826, "ground_truth": 0}, {"key": "26553115", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.45132651620492237, "ground_truth": 0}, {"key": "26553115", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754067302269895, "ground_truth": 0}, {"key": "37872311", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8714748629761523, "ground_truth": 0}, {"key": "37872311", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5292633936264678, "ground_truth": 0}, {"key": "37872311", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8438951228790487, "ground_truth": 0}, {"key": "37872311", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9241418233998201, "ground_truth": 0}, {"key": "37872311", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744660688656, "ground_truth": 0}, {"key": "35553131", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8449215292672314, "ground_truth": 0}, {"key": "35553131", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8955226911119869, "ground_truth": 0}, {"key": "35553131", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8864204170838169, "ground_truth": 0}, {"key": "35553131", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.773216374778738, "ground_truth": 0}, {"key": "35553131", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920216727189, "ground_truth": 0}, {"key": "39038936", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6636689290103642, "ground_truth": 0}, {"key": "39038936", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7217432016077477, "ground_truth": 0}, {"key": "39038936", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6825737204788854, "ground_truth": 0}, {"key": "39038936", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641319073219, "ground_truth": 0}, {"key": "39038936", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633925660323, "ground_truth": 0}, {"key": "38735486", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9905874111796202, "ground_truth": 0}, {"key": "38735486", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9923637830485292, "ground_truth": 0}, {"key": "38735486", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9820137887425442, "ground_truth": 0}, {"key": "38735486", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9882221563420843, "ground_truth": 0}, {"key": "38735486", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9954261355146456, "ground_truth": 0}, {"key": "17087845", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.48242908611501795, "ground_truth": 0}, {"key": "17087845", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.47268348623321926, "ground_truth": 0}, {"key": "17087845", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6169358144780367, "ground_truth": 0}, {"key": "17087845", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3433417299865051, "ground_truth": 0}, {"key": "17087845", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4148988634195502, "ground_truth": 0}, {"key": "37443011", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6531269311439554, "ground_truth": 0}, {"key": "37443011", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7853085784818136, "ground_truth": 0}, {"key": "37443011", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5640984484632848, "ground_truth": 0}, {"key": "37443011", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460137081652614, "ground_truth": 0}, {"key": "37443011", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615900495018, "ground_truth": 0}, {"key": "36855749", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7476159437219708, "ground_truth": 0}, {"key": "36855749", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7918210615684138, "ground_truth": 0}, {"key": "36855749", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8267118014011703, "ground_truth": 0}, {"key": "36855749", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036200620113, "ground_truth": 0}, {"key": "36855749", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772236898611, "ground_truth": 0}, {"key": "35613141", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6893056104434371, "ground_truth": 0}, {"key": "35613141", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7634837801505424, "ground_truth": 0}, {"key": "35613141", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8933094031089248, "ground_truth": 0}, {"key": "35613141", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8791467668096244, "ground_truth": 0}, {"key": "35613141", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804187684841, "ground_truth": 0}, {"key": "39088847", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6206216371741546, "ground_truth": 0}, {"key": "39088847", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3998116272950481, "ground_truth": 0}, {"key": "39088847", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.45907611360882944, "ground_truth": 0}, {"key": "39088847", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2735743946167354, "ground_truth": 0}, {"key": "39088847", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.41869690950827537, "ground_truth": 0}, {"key": "33197277", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7371581378392733, "ground_truth": 0}, {"key": "33197277", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7931059594120973, "ground_truth": 0}, {"key": "33197277", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7956580905864917, "ground_truth": 0}, {"key": "33197277", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441020884528, "ground_truth": 0}, {"key": "33197277", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592253917240067, "ground_truth": 0}, {"key": "33815489", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4397473141077146, "ground_truth": 0}, {"key": "33815489", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4571367043336358, "ground_truth": 0}, {"key": "33815489", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.37387582084457155, "ground_truth": 0}, {"key": "33815489", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4092207990040189, "ground_truth": 0}, {"key": "33815489", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.579400396559727, "ground_truth": 0}, {"key": "35862754", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7956581229385202, "ground_truth": 0}, {"key": "35862754", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8187368115717586, "ground_truth": 0}, {"key": "35862754", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7505527723855835, "ground_truth": 0}, {"key": "35862754", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933235893203, "ground_truth": 0}, {"key": "35862754", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.873214830085043, "ground_truth": 0}, {"key": "36080615", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2829881266458225, "ground_truth": 0}, {"key": "36080615", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4687905952863397, "ground_truth": 0}, {"key": "36080615", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3849121427394554, "ground_truth": 0}, {"key": "36080615", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011696926471, "ground_truth": 0}, {"key": "36080615", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.32766829182911056, "ground_truth": 0}, {"key": "22822742", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.844921531155577, "ground_truth": 0}, {"key": "22822742", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8056321849226353, "ground_truth": 0}, {"key": "22822742", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8679338429347844, "ground_truth": 0}, {"key": "22822742", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.893309400106067, "ground_truth": 0}, {"key": "22822742", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445554229567, "ground_truth": 0}, {"key": "39747536", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7248702662624411, "ground_truth": 0}, {"key": "39747536", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5640984667974576, "ground_truth": 0}, {"key": "39747536", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5869964345468888, "ground_truth": 0}, {"key": "39747536", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094763119985, "ground_truth": 0}, {"key": "39747536", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563608998018, "ground_truth": 0}, {"key": "34218396", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8386797638228143, "ground_truth": 0}, {"key": "34218396", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.858718589696359, "ground_truth": 0}, {"key": "34218396", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8397339704284629, "ground_truth": 0}, {"key": "34218396", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343684934877, "ground_truth": 0}, {"key": "34218396", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059189442874, "ground_truth": 0}, {"key": "39150388", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8175744841934885, "ground_truth": 0}, {"key": "39150388", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5428632699889051, "ground_truth": 0}, {"key": "39150388", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6187804393139479, "ground_truth": 0}, {"key": "39150388", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.48828340124871195, "ground_truth": 0}, {"key": "39150388", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3504213777324043, "ground_truth": 0}, {"key": "28765782", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8289388041800854, "ground_truth": 0}, {"key": "28765782", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7879311971900486, "ground_truth": 0}, {"key": "28765782", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.793105934154939, "ground_truth": 0}, {"key": "28765782", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437675307254, "ground_truth": 0}, {"key": "28765782", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245987127169, "ground_truth": 0}, {"key": "35828022", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.48438006564692254, "ground_truth": 0}, {"key": "35828022", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238846821244, "ground_truth": 0}, {"key": "35828022", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.667147696521373, "ground_truth": 0}, {"key": "35828022", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4551985883321226, "ground_truth": 0}, {"key": "35828022", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366205963879, "ground_truth": 0}, {"key": "27717735", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5506073763266519, "ground_truth": 0}, {"key": "27717735", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7918210673160172, "ground_truth": 0}, {"key": "27717735", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3720487616961938, "ground_truth": 0}, {"key": "27717735", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239966797437, "ground_truth": 0}, {"key": "27717735", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199073692342, "ground_truth": 0}, {"key": "37977826", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4571367101823984, "ground_truth": 0}, {"key": "37977826", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3451052661716217, "ground_truth": 0}, {"key": "37977826", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5640984984467221, "ground_truth": 0}, {"key": "37977826", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982141276382, "ground_truth": 0}, {"key": "37977826", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.48047865501821874, "ground_truth": 0}, {"key": "31768588", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9105454030071827, "ground_truth": 0}, {"key": "31768588", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9532750403620964, "ground_truth": 0}, {"key": "31768588", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9026096051779601, "ground_truth": 0}, {"key": "31768588", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204068896319, "ground_truth": 0}, {"key": "31768588", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377770026522, "ground_truth": 0}, {"key": "37183351", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3849121422452802, "ground_truth": 0}, {"key": "37183351", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2689414231286388, "ground_truth": 0}, {"key": "37183351", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.414898830661535, "ground_truth": 0}, {"key": "37183351", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34158249455198153, "ground_truth": 0}, {"key": "37183351", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629586142799964, "ground_truth": 0}, {"key": "39622090", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.476579643548032, "ground_truth": 0}, {"key": "39622090", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.35220177696223726, "ground_truth": 0}, {"key": "39622090", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5926666007468353, "ground_truth": 0}, {"key": "39622090", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033611575635, "ground_truth": 0}, {"key": "39622090", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3942009695023579, "ground_truth": 0}, {"key": "39272756", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5888891633423208, "ground_truth": 0}, {"key": "39272756", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5486735144768542, "ground_truth": 0}, {"key": "39272756", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3276682824994128, "ground_truth": 0}, {"key": "39272756", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850363459136, "ground_truth": 0}, {"key": "39272756", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125589358351, "ground_truth": 0}, {"key": "32138822", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.48242908980760835, "ground_truth": 0}, {"key": "32138822", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5679366173662007, "ground_truth": 0}, {"key": "32138822", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6020615957834528, "ground_truth": 0}, {"key": "32138822", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892337053782764, "ground_truth": 0}, {"key": "32138822", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666486439359, "ground_truth": 0}, {"key": "31070114", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.22000711147652072, "ground_truth": 0}, {"key": "31070114", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.20307461749808092, "ground_truth": 0}, {"key": "31070114", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.19436780167172904, "ground_truth": 0}, {"key": "31070114", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.1356895447689681, "ground_truth": 0}, {"key": "31070114", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.16776333511354433, "ground_truth": 0}, {"key": "39652762", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.844921521212399, "ground_truth": 0}, {"key": "39652762", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8606036145938435, "ground_truth": 0}, {"key": "39652762", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8895288495162607, "ground_truth": 0}, {"key": "39652762", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389770166478, "ground_truth": 0}, {"key": "39652762", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619305399145, "ground_truth": 0}, {"key": "33258866", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.37204875763277756, "ground_truth": 0}, {"key": "33258866", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6495786180809402, "ground_truth": 0}, {"key": "33258866", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46490156846212666, "ground_truth": 0}, {"key": "33258866", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47852884155716024, "ground_truth": 0}, {"key": "33258866", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897205059931, "ground_truth": 0}, {"key": "36962388", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.663668950811186, "ground_truth": 0}, {"key": "36962388", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.23934935815092379, "ground_truth": 0}, {"key": "36962388", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.57749536588031, "ground_truth": 0}, {"key": "36962388", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926666089555724, "ground_truth": 0}, {"key": "36962388", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984627540684, "ground_truth": 0}, {"key": "32282272", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.12002562832781453, "ground_truth": 0}, {"key": "32282272", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.07921032322023418, "ground_truth": 0}, {"key": "32282272", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.31742628293457414, "ground_truth": 0}, {"key": "32282272", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.1015894398090758, "ground_truth": 0}, {"key": "32282272", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.35577489625950287, "ground_truth": 0}, {"key": "36093072", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8947894646456055, "ground_truth": 0}, {"key": "36093072", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8661325060252425, "ground_truth": 0}, {"key": "36093072", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9012274180016296, "ground_truth": 0}, {"key": "36093072", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9273632927485672, "ground_truth": 0}, {"key": "36093072", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619094343326, "ground_truth": 0}, {"key": "38879972", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7106283058135859, "ground_truth": 0}, {"key": "38879972", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.799442324802406, "ground_truth": 0}, {"key": "38879972", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5755879785768446, "ground_truth": 0}, {"key": "38879972", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631520566041, "ground_truth": 0}, {"key": "38879972", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195212914812174, "ground_truth": 0}, {"key": "32106473", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4921881341390175, "ground_truth": 0}, {"key": "32106473", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5926666144594452, "ground_truth": 0}, {"key": "32106473", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7461389836533048, "ground_truth": 0}, {"key": "32106473", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631555693094, "ground_truth": 0}, {"key": "32106473", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154240080670349, "ground_truth": 0}, {"key": "40415815", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6057990264012453, "ground_truth": 0}, {"key": "40415815", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5019531070343921, "ground_truth": 0}, {"key": "40415815", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.45907615365838633, "ground_truth": 0}, {"key": "40415815", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073927887835, "ground_truth": 0}, {"key": "40415815", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082840154138, "ground_truth": 0}, {"key": "34581918", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5292633764833585, "ground_truth": 0}, {"key": "34581918", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6261241529602474, "ground_truth": 0}, {"key": "34581918", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.36840569139298923, "ground_truth": 0}, {"key": "34581918", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3942009344998934, "ground_truth": 0}, {"key": "34581918", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056148717533, "ground_truth": 0}, {"key": "33004157", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8856314742522915, "ground_truth": 0}, {"key": "33004157", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.867933847832929, "ground_truth": 0}, {"key": "33004157", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7676898560022556, "ground_truth": 0}, {"key": "33004157", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.867933838698234, "ground_truth": 0}, {"key": "33004157", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797590323922, "ground_truth": 0}, {"key": "30334943", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8714748593688127, "ground_truth": 0}, {"key": "30334943", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8140528158821825, "ground_truth": 0}, {"key": "30334943", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7264256027073104, "ground_truth": 0}, {"key": "30334943", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089231255331, "ground_truth": 0}, {"key": "30334943", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210753938651, "ground_truth": 0}, {"key": "33280503", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3415825018697548, "ground_truth": 0}, {"key": "33280503", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4882833791619452, "ground_truth": 0}, {"key": "33280503", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3593641489658444, "ground_truth": 0}, {"key": "33280503", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.49414088428595704, "ground_truth": 0}, {"key": "33280503", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526421263796, "ground_truth": 0}, {"key": "25726782", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8354835191123943, "ground_truth": 0}, {"key": "25726782", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8799743789799558, "ground_truth": 0}, {"key": "25726782", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9124361562643024, "ground_truth": 0}, {"key": "25726782", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583539735843, "ground_truth": 0}, {"key": "25726782", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9273632902979654, "ground_truth": 0}, {"key": "35479854", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7325918201577407, "ground_truth": 0}, {"key": "35479854", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6039318428490964, "ground_truth": 0}, {"key": "35479854", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8006920125969186, "ground_truth": 0}, {"key": "35479854", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082801601093, "ground_truth": 0}, {"key": "35479854", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943891571642, "ground_truth": 0}, {"key": "32716226", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4092208348320741, "ground_truth": 0}, {"key": "32716226", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.49804686657228675, "ground_truth": 0}, {"key": "32716226", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6039318506270505, "ground_truth": 0}, {"key": "32716226", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033586518708, "ground_truth": 0}, {"key": "32716226", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.690976294289688, "ground_truth": 0}, {"key": "37047554", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2583259582860614, "ground_truth": 0}, {"key": "37047554", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4921881417000034, "ground_truth": 0}, {"key": "37047554", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5097644048649814, "ground_truth": 0}, {"key": "37047554", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.28457600829523333, "ground_truth": 0}, {"key": "37047554", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.26740816972922465, "ground_truth": 0}, {"key": "36565290", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8774767766707983, "ground_truth": 0}, {"key": "36565290", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7918210849152537, "ground_truth": 0}, {"key": "36565290", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7879312030062862, "ground_truth": 0}, {"key": "36565290", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587957299585, "ground_truth": 0}, {"key": "36565290", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.889528855913446, "ground_truth": 0}, {"key": "27758640", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.823328404561818, "ground_truth": 0}, {"key": "27758640", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5794004099392576, "ground_truth": 0}, {"key": "27758640", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6842640261871675, "ground_truth": 0}, {"key": "27758640", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723614248666, "ground_truth": 0}, {"key": "27758640", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916152055226, "ground_truth": 0}, {"key": "28897118", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548638501849, "ground_truth": 0}, {"key": "28897118", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4474603393225037, "ground_truth": 0}, {"key": "28897118", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6909762868802547, "ground_truth": 0}, {"key": "28897118", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437586350671, "ground_truth": 0}, {"key": "28897118", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619229008267987, "ground_truth": 0}, {"key": "38452661", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9485372392907132, "ground_truth": 0}, {"key": "38452661", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8140528228285079, "ground_truth": 0}, {"key": "38452661", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8164063804593571, "ground_truth": 0}, {"key": "38452661", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.775944573004047, "ground_truth": 0}, {"key": "38452661", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872079169765, "ground_truth": 0}, {"key": "38033492", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4843800659691149, "ground_truth": 0}, {"key": "38033492", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.640635875427134, "ground_truth": 0}, {"key": "38033492", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6636689488338692, "ground_truth": 0}, {"key": "38033492", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365437335441, "ground_truth": 0}, {"key": "38033492", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593268007685, "ground_truth": 0}, {"key": "35949555", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8774767900130993, "ground_truth": 0}, {"key": "35949555", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9178933683413736, "ground_truth": 0}, {"key": "35949555", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8807970672113762, "ground_truth": 0}, {"key": "35949555", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9207896770864092, "ground_truth": 0}, {"key": "35949555", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9390248134070495, "ground_truth": 0}, {"key": "15263826", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5640984589909904, "ground_truth": 0}, {"key": "15263826", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5175708749626213, "ground_truth": 0}, {"key": "15263826", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6206216110837423, "ground_truth": 0}, {"key": "15263826", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983122089969838, "ground_truth": 0}, {"key": "15263826", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185166254889, "ground_truth": 0}, {"key": "37313866", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.910545397996038, "ground_truth": 0}, {"key": "37313866", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6926419581114226, "ground_truth": 0}, {"key": "37313866", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7745833913739898, "ground_truth": 0}, {"key": "37313866", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239752274933, "ground_truth": 0}, {"key": "37313866", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241504408816, "ground_truth": 0}, {"key": "13911157", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8947894704564052, "ground_truth": 0}, {"key": "13911157", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9553191303002214, "ground_truth": 0}, {"key": "13911157", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9053222973037591, "ground_truth": 0}, {"key": "13911157", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110495220598, "ground_truth": 0}, {"key": "13911157", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372107861664304, "ground_truth": 0}, {"key": "39594894", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "39594894", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5660185204101108, "ground_truth": 0}, {"key": "39594894", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4130035456238486, "ground_truth": 0}, {"key": "39594894", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.46684556831491436, "ground_truth": 0}, {"key": "39594894", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926665863905394, "ground_truth": 0}, {"key": "34096170", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8044059197576728, "ground_truth": 0}, {"key": "34096170", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6001883592963521, "ground_truth": 0}, {"key": "34096170", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8198933421295139, "ground_truth": 0}, {"key": "34096170", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.615087838999824, "ground_truth": 0}, {"key": "34096170", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.729519764430292, "ground_truth": 0}, {"key": "37891952", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9842154400159652, "ground_truth": 0}, {"key": "37891952", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.985718066557714, "ground_truth": 0}, {"key": "37891952", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9834704437596694, "ground_truth": 0}, {"key": "37891952", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9693241969043475, "ground_truth": 0}, {"key": "37891952", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9697854138643967, "ground_truth": 0}, {"key": "40186158", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6057990434167287, "ground_truth": 0}, {"key": "40186158", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4016877992382314, "ground_truth": 0}, {"key": "40186158", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5078118474677275, "ground_truth": 0}, {"key": "40186158", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4436004068436147, "ground_truth": 0}, {"key": "40186158", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792063708266, "ground_truth": 0}, {"key": "37049719", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6757645877830876, "ground_truth": 0}, {"key": "37049719", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7217432160050044, "ground_truth": 0}, {"key": "37049719", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8615382045222887, "ground_truth": 0}, {"key": "37049719", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251150575886, "ground_truth": 0}, {"key": "37049719", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804398130687, "ground_truth": 0}, {"key": "34610504", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8910549591841594, "ground_truth": 0}, {"key": "34610504", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8918110421431218, "ground_truth": 0}, {"key": "34610504", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9118099541687317, "ground_truth": 0}, {"key": "34610504", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8791467697259278, "ground_truth": 0}, {"key": "34610504", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215240728517, "ground_truth": 0}, {"key": "37595429", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8128673168944549, "ground_truth": 0}, {"key": "37595429", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7662936320162421, "ground_truth": 0}, {"key": "37595429", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7879311976904657, "ground_truth": 0}, {"key": "37595429", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.767689860667758, "ground_truth": 0}, {"key": "37595429", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909763022800927, "ground_truth": 0}, {"key": "29772670", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.14318770549015383, "ground_truth": 0}, {"key": "29772670", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41489884104104263, "ground_truth": 0}, {"key": "29772670", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.37754067593181234, "ground_truth": 0}, {"key": "29772670", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591064923704, "ground_truth": 0}, {"key": "29772670", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.24798744334085399, "ground_truth": 0}, {"key": "36369872", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5755880164907694, "ground_truth": 0}, {"key": "36369872", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41869692288803284, "ground_truth": 0}, {"key": "36369872", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5698526494835617, "ground_truth": 0}, {"key": "36369872", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3904758359306258, "ground_truth": 0}, {"key": "36369872", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013627254668, "ground_truth": 0}, {"key": "34527433", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4765796437620807, "ground_truth": 0}, {"key": "34527433", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.32423539623307973, "ground_truth": 0}, {"key": "34527433", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4785288390134265, "ground_truth": 0}, {"key": "34527433", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4474602957416603, "ground_truth": 0}, {"key": "34527433", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4532618659549392, "ground_truth": 0}, {"key": "31111734", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7931059671945839, "ground_truth": 0}, {"key": "31111734", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7154240097072811, "ground_truth": 0}, {"key": "31111734", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6315943374947219, "ground_truth": 0}, {"key": "31111734", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307586434154, "ground_truth": 0}, {"key": "31111734", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125718787516, "ground_truth": 0}, {"key": "40303872", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6619228759401486, "ground_truth": 0}, {"key": "40303872", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7981867666602033, "ground_truth": 0}, {"key": "40303872", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5679366520090581, "ground_truth": 0}, {"key": "40303872", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867942726741, "ground_truth": 0}, {"key": "40303872", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884539405071, "ground_truth": 0}, {"key": "33653553", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5292633801342376, "ground_truth": 0}, {"key": "33653553", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6688802611654393, "ground_truth": 0}, {"key": "33653553", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6334102527990968, "ground_truth": 0}, {"key": "33653553", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570648354085956, "ground_truth": 0}, {"key": "33653553", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704545158563, "ground_truth": 0}, {"key": "34404510", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8255897077141505, "ground_truth": 0}, {"key": "34404510", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.646013689582136, "ground_truth": 0}, {"key": "34404510", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5774953739045869, "ground_truth": 0}, {"key": "34404510", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197778276611, "ground_truth": 0}, {"key": "34404510", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.724870256481788, "ground_truth": 0}, {"key": "35568692", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4073334103086613, "ground_truth": 0}, {"key": "35568692", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1766716019072458, "ground_truth": 0}, {"key": "35568692", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2568320002775455, "ground_truth": 0}, {"key": "35568692", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225259838760708, "ground_truth": 0}, {"key": "35568692", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.275129733847578, "ground_truth": 0}, {"key": "39151664", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3960681591152104, "ground_truth": 0}, {"key": "39151664", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5755879731288763, "ground_truth": 0}, {"key": "39151664", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.26894142477326194, "ground_truth": 0}, {"key": "39151664", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937837576712796, "ground_truth": 0}, {"key": "39151664", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3486451170225503, "ground_truth": 0}, {"key": "37493670", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9963214909280315, "ground_truth": 0}, {"key": "37493670", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9989098100042482, "ground_truth": 0}, {"key": "37493670", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9978510506994679, "ground_truth": 0}, {"key": "37493670", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9978172834869556, "ground_truth": 0}, {"key": "37493670", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9981030799079371, "ground_truth": 0}, {"key": "21935983", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3073580134125729, "ground_truth": 0}, {"key": "21935983", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3415825121388104, "ground_truth": 0}, {"key": "21935983", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2613309354583696, "ground_truth": 0}, {"key": "21935983", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2674081628673938, "ground_truth": 0}, {"key": "21935983", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1801066641001446, "ground_truth": 0}, {"key": "38174214", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6976089194987386, "ground_truth": 0}, {"key": "38174214", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7520125653788927, "ground_truth": 0}, {"key": "38174214", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7520125593416307, "ground_truth": 0}, {"key": "38174214", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672109152263, "ground_truth": 0}, {"key": "38174214", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837742029227, "ground_truth": 0}, {"key": "40319923", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7905303188250885, "ground_truth": 0}, {"key": "40319923", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9257686262700958, "ground_truth": 0}, {"key": "40319923", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7356416378662803, "ground_truth": 0}, {"key": "40319923", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666777084168, "ground_truth": 0}, {"key": "40319923", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9178933772616718, "ground_truth": 0}, {"key": "36478264", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.523420362636058, "ground_truth": 0}, {"key": "36478264", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7154239844315388, "ground_truth": 0}, {"key": "36478264", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8198933375278876, "ground_truth": 0}, {"key": "36478264", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933366157884, "ground_truth": 0}, {"key": "36478264", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165302645286, "ground_truth": 0}, {"key": "11935769", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5983121852368688, "ground_truth": 0}, {"key": "11935769", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5660185298325169, "ground_truth": 0}, {"key": "11935769", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7217432069997899, "ground_truth": 0}, {"key": "11935769", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737304340905, "ground_truth": 0}, {"key": "11935769", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.750552763422851, "ground_truth": 0}, {"key": "33373410", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.18594720381597918, "ground_truth": 0}, {"key": "33373410", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2845760098509694, "ground_truth": 0}, {"key": "33373410", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.17441027431839923, "ground_truth": 0}, {"key": "33373410", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.23934934142798367, "ground_truth": 0}, {"key": "33373410", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3311197363290991, "ground_truth": 0}, {"key": "11130680", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7490872182600808, "ground_truth": 0}, {"key": "11130680", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8255897468163584, "ground_truth": 0}, {"key": "11130680", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.20946968066258698, "ground_truth": 0}, {"key": "11130680", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.836554553652411, "ground_truth": 0}, {"key": "11130680", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743747812888, "ground_truth": 0}, {"key": "34868650", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6442251194840386, "ground_truth": 0}, {"key": "34868650", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5602526726107369, "ground_truth": 0}, {"key": "34868650", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8140528200726582, "ground_truth": 0}, {"key": "34868650", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201715045418965, "ground_truth": 0}, {"key": "34868650", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.749087228235935, "ground_truth": 0}, {"key": "33960561", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.48438006158413005, "ground_truth": 0}, {"key": "33960561", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4148988129447493, "ground_truth": 0}, {"key": "33960561", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5019530976044799, "ground_truth": 0}, {"key": "33960561", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216148826609, "ground_truth": 0}, {"key": "33960561", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3575675387658379, "ground_truth": 0}, {"key": "22504858", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7325918428751242, "ground_truth": 0}, {"key": "22504858", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5428632771224406, "ground_truth": 0}, {"key": "22504858", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7943849644843531, "ground_truth": 0}, {"key": "22504858", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526055367043, "ground_truth": 0}, {"key": "22504858", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804786942236225, "ground_truth": 0}, {"key": "32283530", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6388352824358582, "ground_truth": 0}, {"key": "32283530", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5350984077980715, "ground_truth": 0}, {"key": "32283530", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7799929019014519, "ground_truth": 0}, {"key": "32283530", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288356465599, "ground_truth": 0}, {"key": "32283530", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256162039804, "ground_truth": 0}, {"key": "38377099", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8479677558569833, "ground_truth": 0}, {"key": "38377099", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6495786118353021, "ground_truth": 0}, {"key": "38377099", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8175744800586073, "ground_truth": 0}, {"key": "38377099", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797711484268, "ground_truth": 0}, {"key": "38377099", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185847382465, "ground_truth": 0}, {"key": "36105123", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9161096189965653, "ground_truth": 0}, {"key": "36105123", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9309620740639747, "ground_truth": 0}, {"key": "36105123", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9469902306294191, "ground_truth": 0}, {"key": "36105123", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9407897495811048, "ground_truth": 0}, {"key": "36105123", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.812867309886652, "ground_truth": 0}, {"key": "33527826", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7563575611052861, "ground_truth": 0}, {"key": "33527826", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8670357498531025, "ground_truth": 0}, {"key": "33527826", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8031737989763881, "ground_truth": 0}, {"key": "33527826", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288430816414, "ground_truth": 0}, {"key": "33527826", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923170133623, "ground_truth": 0}, {"key": "32349891", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5964331245430466, "ground_truth": 0}, {"key": "32349891", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7201714948309215, "ground_truth": 0}, {"key": "32349891", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7534666519096549, "ground_truth": 0}, {"key": "32349891", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666546872809, "ground_truth": 0}, {"key": "32349891", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737927571209, "ground_truth": 0}, {"key": "34281974", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6169358117533351, "ground_truth": 0}, {"key": "34281974", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6039318361371994, "ground_truth": 0}, {"key": "34281974", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7918210853620664, "ground_truth": 0}, {"key": "34281974", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419673137579, "ground_truth": 0}, {"key": "34281974", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544248043924, "ground_truth": 0}, {"key": "29387866", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6279511876841148, "ground_truth": 0}, {"key": "29387866", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22000709599355306, "ground_truth": 0}, {"key": "29387866", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5097643991309853, "ground_truth": 0}, {"key": "29387866", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736783966291435, "ground_truth": 0}, {"key": "29387866", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420094119798965, "ground_truth": 0}, {"key": "35731925", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9950945940218129, "ground_truth": 0}, {"key": "35731925", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9954967277340565, "ground_truth": 0}, {"key": "35731925", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9775429458791856, "ground_truth": 0}, {"key": "35731925", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9761291656285134, "ground_truth": 0}, {"key": "35731925", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9944450748869549, "ground_truth": 0}, {"key": "38829733", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7549149881771836, "ground_truth": 0}, {"key": "38829733", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8633916141807869, "ground_truth": 0}, {"key": "38829733", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6909763027737307, "ground_truth": 0}, {"key": "38829733", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105527942525, "ground_truth": 0}, {"key": "38829733", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.874077241159161, "ground_truth": 0}, {"key": "24624736", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8397339469823093, "ground_truth": 0}, {"key": "24624736", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9184802400516682, "ground_truth": 0}, {"key": "24624736", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8832359764055121, "ground_truth": 0}, {"key": "24624736", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578459487213, "ground_truth": 0}, {"key": "24624736", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145783474666, "ground_truth": 0}, {"key": "36928562", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9744347863335643, "ground_truth": 0}, {"key": "36928562", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9643214493504917, "ground_truth": 0}, {"key": "36928562", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9621075721644159, "ground_truth": 0}, {"key": "36928562", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9842154380125847, "ground_truth": 0}, {"key": "36928562", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9704646619902846, "ground_truth": 0}, {"key": "34941119", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7676898564180608, "ground_truth": 0}, {"key": "34941119", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.42632158973733986, "ground_truth": 0}, {"key": "34941119", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5331544001630333, "ground_truth": 0}, {"key": "34941119", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591402187768, "ground_truth": 0}, {"key": "34941119", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132648700228056, "ground_truth": 0}, {"key": "30206231", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.44746026989776966, "ground_truth": 0}, {"key": "30206231", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3208212950271229, "ground_truth": 0}, {"key": "30206231", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5175708676268879, "ground_truth": 0}, {"key": "30206231", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381560871953, "ground_truth": 0}, {"key": "30206231", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832010913013, "ground_truth": 0}, {"key": "35584972", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.46879064298618184, "ground_truth": 0}, {"key": "35584972", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5794003896742997, "ground_truth": 0}, {"key": "35584972", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6619228992056198, "ground_truth": 0}, {"key": "35584972", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4397473483251028, "ground_truth": 0}, {"key": "35584972", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575764191006, "ground_truth": 0}, {"key": "39277709", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9465966734779429, "ground_truth": 0}, {"key": "39277709", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9640516749727617, "ground_truth": 0}, {"key": "39277709", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9433475733618472, "ground_truth": 0}, {"key": "39277709", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240748790542, "ground_truth": 0}, {"key": "39277709", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036176546479, "ground_truth": 0}, {"key": "36123657", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8255897142107537, "ground_truth": 0}, {"key": "36123657", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7786493160039724, "ground_truth": 0}, {"key": "36123657", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.777299861839964, "ground_truth": 0}, {"key": "36123657", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191549615935, "ground_truth": 0}, {"key": "36123657", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982087181923, "ground_truth": 0}, {"key": "33363938", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7620701055411687, "ground_truth": 0}, {"key": "33363938", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5851011185713858, "ground_truth": 0}, {"key": "33363938", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7690802296514985, "ground_truth": 0}, {"key": "33363938", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8955226755004149, "ground_truth": 0}, {"key": "33363938", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085816040003, "ground_truth": 0}, {"key": "37349129", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7826624735167098, "ground_truth": 0}, {"key": "37349129", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6224593269876697, "ground_truth": 0}, {"key": "37349129", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7839884657875537, "ground_truth": 0}, {"key": "37349129", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318235677391, "ground_truth": 0}, {"key": "37349129", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666496221869, "ground_truth": 0}, {"key": "37160199", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4035668471503862, "ground_truth": 0}, {"key": "37160199", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5234203315129958, "ground_truth": 0}, {"key": "37160199", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5660185120333172, "ground_truth": 0}, {"key": "37160199", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366066308149, "ground_truth": 0}, {"key": "37160199", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.37570646108486305, "ground_truth": 0}, {"key": "35891053", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8449215205676924, "ground_truth": 0}, {"key": "35891053", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9289263264165175, "ground_truth": 0}, {"key": "35891053", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9079671425001018, "ground_truth": 0}, {"key": "35891053", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392890907119, "ground_truth": 0}, {"key": "35891053", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210892629232, "ground_truth": 0}, {"key": "40694542", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6261241883533456, "ground_truth": 0}, {"key": "40694542", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6132365521875476, "ground_truth": 0}, {"key": "40694542", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7057850374625967, "ground_truth": 0}, {"key": "40694542", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089136626202, "ground_truth": 0}, {"key": "40694542", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370308203641759, "ground_truth": 0}, {"key": "24645770", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6076631790813222, "ground_truth": 0}, {"key": "24645770", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6057990612675312, "ground_truth": 0}, {"key": "24645770", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7074046708834405, "ground_truth": 0}, {"key": "24645770", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684690547467, "ground_truth": 0}, {"key": "24645770", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926666032932327, "ground_truth": 0}, {"key": "37974587", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7918210887646642, "ground_truth": 0}, {"key": "37974587", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9314625062044455, "ground_truth": 0}, {"key": "37974587", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8428631320680745, "ground_truth": 0}, {"key": "37974587", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.794384973370457, "ground_truth": 0}, {"key": "37974587", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424417935253, "ground_truth": 0}, {"key": "40354149", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7745833978889773, "ground_truth": 0}, {"key": "40354149", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8529354753165039, "ground_truth": 0}, {"key": "40354149", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7956581168044329, "ground_truth": 0}, {"key": "40354149", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.754914999765361, "ground_truth": 0}, {"key": "40354149", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358737796513, "ground_truth": 0}, {"key": "35519470", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2281565030845805, "ground_truth": 0}, {"key": "35519470", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5195212995418687, "ground_truth": 0}, {"key": "35519470", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.25238402536508614, "ground_truth": 0}, {"key": "35519470", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864512728589403, "ground_truth": 0}, {"key": "35519470", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064793409462, "ground_truth": 0}, {"key": "36185624", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.806852629479433, "ground_truth": 0}, {"key": "36185624", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7620701039682168, "ground_truth": 0}, {"key": "36185624", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.841825652752866, "ground_truth": 0}, {"key": "36185624", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253691693138, "ground_truth": 0}, {"key": "36185624", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869880586846, "ground_truth": 0}, {"key": "39306113", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.302391096058883, "ground_truth": 0}, {"key": "39306113", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5389832088220987, "ground_truth": 0}, {"key": "39306113", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.30239108926934644, "ground_truth": 0}, {"key": "39306113", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.25238404161309796, "ground_truth": 0}, {"key": "39306113", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3174262669252661, "ground_truth": 0}, {"key": "19347718", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8092759807453082, "ground_truth": 0}, {"key": "19347718", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5602526894542307, "ground_truth": 0}, {"key": "19347718", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7025300781254906, "ground_truth": 0}, {"key": "19347718", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601356637315, "ground_truth": 0}, {"key": "19347718", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.697608920601943, "ground_truth": 0}, {"key": "21870064", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4902356185027016, "ground_truth": 0}, {"key": "21870064", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.27512973557035464, "ground_truth": 0}, {"key": "21870064", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.24077460583692928, "ground_truth": 0}, {"key": "21870064", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2893717181143788, "ground_truth": 0}, {"key": "21870064", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.47268349605451676, "ground_truth": 0}, {"key": "37675776", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9130583577146345, "ground_truth": 0}, {"key": "37675776", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8661325159152393, "ground_truth": 0}, {"key": "37675776", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8606036154548763, "ground_truth": 0}, {"key": "37675776", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970699460794, "ground_truth": 0}, {"key": "37675776", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9105454000193983, "ground_truth": 0}, {"key": "38107017", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6723316998232205, "ground_truth": 0}, {"key": "38107017", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7371581606721638, "ground_truth": 0}, {"key": "38107017", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7090191284413998, "ground_truth": 0}, {"key": "38107017", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621765031578452, "ground_truth": 0}, {"key": "38107017", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442250878646971, "ground_truth": 0}, {"key": "40046472", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.33807710855195916, "ground_truth": 0}, {"key": "40046472", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3539862827052784, "ground_truth": 0}, {"key": "40046472", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6334102538940494, "ground_truth": 0}, {"key": "40046472", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4941408979376867, "ground_truth": 0}, {"key": "40046472", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.28937168842002253, "ground_truth": 0}, {"key": "32157820", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6706082590530734, "ground_truth": 0}, {"key": "32157820", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6460137052754826, "ground_truth": 0}, {"key": "32157820", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5448014136531156, "ground_truth": 0}, {"key": "32157820", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.40922083004375404, "ground_truth": 0}, {"key": "32157820", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990508529305, "ground_truth": 0}, {"key": "41004037", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7676898434232052, "ground_truth": 0}, {"key": "41004037", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6791786875421403, "ground_truth": 0}, {"key": "41004037", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6531269178005391, "ground_truth": 0}, {"key": "41004037", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526585999785, "ground_truth": 0}, {"key": "41004037", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715049070512, "ground_truth": 0}, {"key": "21387993", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.47657961428102846, "ground_truth": 0}, {"key": "21387993", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6808786263976754, "ground_truth": 0}, {"key": "21387993", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8056321849374909, "ground_truth": 0}, {"key": "21387993", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216245542677, "ground_truth": 0}, {"key": "21387993", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073549007627, "ground_truth": 0}, {"key": "34665539", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5983121742751384, "ground_truth": 0}, {"key": "34665539", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4765796466432469, "ground_truth": 0}, {"key": "34665539", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5794003661018543, "ground_truth": 0}, {"key": "34665539", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.651354860796048, "ground_truth": 0}, {"key": "34665539", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883553998226, "ground_truth": 0}, {"key": "37872111", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3225259688369683, "ground_truth": 0}, {"key": "37872111", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5467381456790432, "ground_truth": 0}, {"key": "37872111", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7745833885753328, "ground_truth": 0}, {"key": "37872111", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238506174207, "ground_truth": 0}, {"key": "37872111", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640405582406, "ground_truth": 0}, {"key": "36629542", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8140527964797122, "ground_truth": 0}, {"key": "36629542", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.546738143120158, "ground_truth": 0}, {"key": "36629542", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6859494654897702, "ground_truth": 0}, {"key": "36629542", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.821044111940726, "ground_truth": 0}, {"key": "36629542", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740096148169, "ground_truth": 0}, {"key": "36487527", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8955226713069486, "ground_truth": 0}, {"key": "36487527", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6825737471730378, "ground_truth": 0}, {"key": "36487527", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8489721977437611, "ground_truth": 0}, {"key": "36487527", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677625309906, "ground_truth": 0}, {"key": "36487527", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869988603115, "ground_truth": 0}, {"key": "37344756", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8568122894809791, "ground_truth": 0}, {"key": "37344756", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7138307340487103, "ground_truth": 0}, {"key": "37344756", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8418256424587633, "ground_truth": 0}, {"key": "37344756", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593423860479, "ground_truth": 0}, {"key": "37344756", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897254975103, "ground_truth": 0}, {"key": "38707722", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5039061512820056, "ground_truth": 0}, {"key": "38707722", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.38306419261165187, "ground_truth": 0}, {"key": "38707722", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.22678363014843606, "ground_truth": 0}, {"key": "38707722", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531204339965, "ground_truth": 0}, {"key": "38707722", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964451323004, "ground_truth": 0}, {"key": "37093419", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3720487866468783, "ground_truth": 0}, {"key": "37093419", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.0637149958028452, "ground_truth": 0}, {"key": "37093419", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1613202419305178, "ground_truth": 0}, {"key": "37093419", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.18952109110180723, "ground_truth": 0}, {"key": "37093419", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1688569591023291, "ground_truth": 0}, {"key": "35547391", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.35220178216113673, "ground_truth": 0}, {"key": "35547391", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6876300091685019, "ground_truth": 0}, {"key": "35547391", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.23510837986299074, "ground_truth": 0}, {"key": "35547391", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.38676344889465564, "ground_truth": 0}, {"key": "35547391", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3259495120045538, "ground_truth": 0}, {"key": "37173168", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6370307928687935, "ground_truth": 0}, {"key": "37173168", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238659018815, "ground_truth": 0}, {"key": "37173168", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7122321865989522, "ground_truth": 0}, {"key": "37173168", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216208194729, "ground_truth": 0}, {"key": "37173168", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014213412211, "ground_truth": 0}, {"key": "30725298", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6424324876284025, "ground_truth": 0}, {"key": "30725298", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.598312188366308, "ground_truth": 0}, {"key": "30725298", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.663668949875911, "ground_truth": 0}, {"key": "30725298", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990696761434, "ground_truth": 0}, {"key": "30725298", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837816977746, "ground_truth": 0}, {"key": "33830573", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7431679991267175, "ground_truth": 0}, {"key": "33830573", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6601723908678451, "ground_truth": 0}, {"key": "33830573", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9046505377103667, "ground_truth": 0}, {"key": "33830573", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382088335489, "ground_truth": 0}, {"key": "33830573", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684696903407, "ground_truth": 0}, {"key": "33415474", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.11676401869006907, "ground_truth": 0}, {"key": "33415474", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.08389038829556954, "ground_truth": 0}, {"key": "33415474", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.11516223938841894, "ground_truth": 0}, {"key": "33415474", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213611153149, "ground_truth": 0}, {"key": "33415474", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469142645115613, "ground_truth": 0}, {"key": "37383994", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.866132518998394, "ground_truth": 0}, {"key": "37383994", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.894051714328519, "ground_truth": 0}, {"key": "37383994", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9105453995168786, "ground_truth": 0}, {"key": "37383994", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923233561479, "ground_truth": 0}, {"key": "37383994", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314693158107, "ground_truth": 0}, {"key": "38576819", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.827828163208243, "ground_truth": 0}, {"key": "38576819", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6808786257707039, "ground_truth": 0}, {"key": "38576819", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4804786786997433, "ground_truth": 0}, {"key": "38576819", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933314487048, "ground_truth": 0}, {"key": "38576819", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690875007784, "ground_truth": 0}, {"key": "34500226", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5448014025418002, "ground_truth": 0}, {"key": "34500226", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5698526645589865, "ground_truth": 0}, {"key": "34500226", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.44360041968919195, "ground_truth": 0}, {"key": "34500226", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935145132049, "ground_truth": 0}, {"key": "34500226", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121992514542, "ground_truth": 0}, {"key": "39856394", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7248702998916918, "ground_truth": 0}, {"key": "39856394", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6424324946549916, "ground_truth": 0}, {"key": "39856394", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7839884575081466, "ground_truth": 0}, {"key": "39856394", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754715355228, "ground_truth": 0}, {"key": "39856394", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102677169732, "ground_truth": 0}, {"key": "35499522", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.11920292774235558, "ground_truth": 0}, {"key": "35499522", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2160115234132049, "ground_truth": 0}, {"key": "35499522", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.11676401457193025, "ground_truth": 0}, {"key": "35499522", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.15713684938830005, "ground_truth": 0}, {"key": "35499522", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.12168575982382593, "ground_truth": 0}, {"key": "30157766", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7520125765236743, "ground_truth": 0}, {"key": "30157766", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8615382193177121, "ground_truth": 0}, {"key": "30157766", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8140528128378033, "ground_truth": 0}, {"key": "30157766", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338286048326, "ground_truth": 0}, {"key": "30157766", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631286936783, "ground_truth": 0}, {"key": "40472346", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.72642561044029, "ground_truth": 0}, {"key": "40472346", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7122322003132431, "ground_truth": 0}, {"key": "40472346", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.83332459925816, "ground_truth": 0}, {"key": "40472346", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527627777011, "ground_truth": 0}, {"key": "40472346", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036053760096, "ground_truth": 0}, {"key": "35305635", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8548846367332382, "ground_truth": 0}, {"key": "35305635", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8749346212264305, "ground_truth": 0}, {"key": "35305635", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9032941936871003, "ground_truth": 0}, {"key": "35305635", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9437636560695406, "ground_truth": 0}, {"key": "35305635", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9213576226850213, "ground_truth": 0}, {"key": "32495926", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7341195523251739, "ground_truth": 0}, {"key": "32495926", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6113819516510192, "ground_truth": 0}, {"key": "32495926", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6808786084922458, "ground_truth": 0}, {"key": "32495926", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701022940745, "ground_truth": 0}, {"key": "32495926", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548489334354, "ground_truth": 0}, {"key": "37353801", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3259495122057496, "ground_truth": 0}, {"key": "37353801", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3504213917370052, "ground_truth": 0}, {"key": "37353801", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.38306416493138173, "ground_truth": 0}, {"key": "37353801", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591009903435, "ground_truth": 0}, {"key": "37353801", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736783899790602, "ground_truth": 0}, {"key": "30159904", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.687629974502692, "ground_truth": 0}, {"key": "30159904", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5525397071939403, "ground_truth": 0}, {"key": "30159904", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7577943938696284, "ground_truth": 0}, {"key": "30159904", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926666055545615, "ground_truth": 0}, {"key": "30159904", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118553844253, "ground_truth": 0}, {"key": "33698679", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.57749536303142, "ground_truth": 0}, {"key": "33698679", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5563995936875171, "ground_truth": 0}, {"key": "33698679", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6943026706968284, "ground_truth": 0}, {"key": "33698679", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366080150414, "ground_truth": 0}, {"key": "33698679", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583423141793, "ground_truth": 0}, {"key": "40530172", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8633916031102263, "ground_truth": 0}, {"key": "40530172", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7295197739370219, "ground_truth": 0}, {"key": "40530172", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6169358370422899, "ground_truth": 0}, {"key": "40530172", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762945480247, "ground_truth": 0}, {"key": "40530172", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118765829554, "ground_truth": 0}, {"key": "40652941", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9309620807111316, "ground_truth": 0}, {"key": "40652941", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.626124174120347, "ground_truth": 0}, {"key": "40652941", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.783988469800638, "ground_truth": 0}, {"key": "40652941", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897256691649, "ground_truth": 0}, {"key": "40652941", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430386523225, "ground_truth": 0}, {"key": "40122246", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43206338620381096, "ground_truth": 0}, {"key": "40122246", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2720245571802825, "ground_truth": 0}, {"key": "40122246", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3073580047112516, "ground_truth": 0}, {"key": "40122246", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.15102780488110584, "ground_truth": 0}, {"key": "40122246", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.30735802590277894, "ground_truth": 0}, {"key": "40032656", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8587185812776842, "ground_truth": 0}, {"key": "40032656", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7786493149904953, "ground_truth": 0}, {"key": "40032656", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7745833860506139, "ground_truth": 0}, {"key": "40032656", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526206135633, "ground_truth": 0}, {"key": "40032656", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026789723342, "ground_truth": 0}, {"key": "38913680", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6206216307230221, "ground_truth": 0}, {"key": "38913680", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37754069598410706, "ground_truth": 0}, {"key": "38913680", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5467381501301091, "ground_truth": 0}, {"key": "38913680", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784178620279, "ground_truth": 0}, {"key": "38913680", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.35756753651645784, "ground_truth": 0}, {"key": "17608039", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.24798742518273478, "ground_truth": 0}, {"key": "17608039", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.33982758471137947, "ground_truth": 0}, {"key": "17608039", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.21866936437601325, "ground_truth": 0}, {"key": "17608039", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.15921741129144648, "ground_truth": 0}, {"key": "17608039", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.319121353222978, "ground_truth": 0}, {"key": "40434901", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8757869773093312, "ground_truth": 0}, {"key": "40434901", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8783142489522853, "ground_truth": 0}, {"key": "40434901", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9309620788812009, "ground_truth": 0}, {"key": "40434901", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110386909242, "ground_truth": 0}, {"key": "40434901", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441065488675, "ground_truth": 0}, {"key": "37680058", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.09670578818846937, "ground_truth": 0}, {"key": "37680058", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2798284932115699, "ground_truth": 0}, {"key": "37680058", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.304041662691369, "ground_truth": 0}, {"key": "37680058", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2523840572309544, "ground_truth": 0}, {"key": "37680058", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33285233385572116, "ground_truth": 0}, {"key": "37291821", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6688802684040693, "ground_truth": 0}, {"key": "37291821", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6566582843629251, "ground_truth": 0}, {"key": "37291821", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5660185112569468, "ground_truth": 0}, {"key": "37291821", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601284620613, "ground_truth": 0}, {"key": "37291821", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.836554575451299, "ground_truth": 0}, {"key": "41002743", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5544704577650288, "ground_truth": 0}, {"key": "41002743", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5888891511892704, "ground_truth": 0}, {"key": "41002743", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5563995676047481, "ground_truth": 0}, {"key": "41002743", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321774388249, "ground_truth": 0}, {"key": "41002743", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884747059117, "ground_truth": 0}, {"key": "36322869", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.822189145527682, "ground_truth": 0}, {"key": "36322869", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8606036217494112, "ground_truth": 0}, {"key": "36322869", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7431680166686583, "ground_truth": 0}, {"key": "36322869", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916019322952, "ground_truth": 0}, {"key": "36322869", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527595369169, "ground_truth": 0}, {"key": "39459717", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.667147666723959, "ground_truth": 0}, {"key": "39459717", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6671476855517103, "ground_truth": 0}, {"key": "39459717", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8596637520369707, "ground_truth": 0}, {"key": "39459717", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956581044604824, "ground_truth": 0}, {"key": "39459717", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382014581194, "ground_truth": 0}, {"key": "36503727", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2991051843916357, "ground_truth": 0}, {"key": "36503727", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.38491212047494605, "ground_truth": 0}, {"key": "36503727", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43782351313315876, "ground_truth": 0}, {"key": "36503727", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324843929307, "ground_truth": 0}, {"key": "36503727", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984676289766, "ground_truth": 0}, {"key": "35682367", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7648915982608593, "ground_truth": 0}, {"key": "35682367", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8824278649957247, "ground_truth": 0}, {"key": "35682367", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7969253708913405, "ground_truth": 0}, {"key": "35682367", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884711062007, "ground_truth": 0}, {"key": "35682367", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592253830700566, "ground_truth": 0}, {"key": "36472353", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6654105705358826, "ground_truth": 0}, {"key": "36472353", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4590761419486325, "ground_truth": 0}, {"key": "36472353", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.45132647942992205, "ground_truth": 0}, {"key": "36472353", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.39047582385326135, "ground_truth": 0}, {"key": "36472353", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757645935287194, "ground_truth": 0}, {"key": "37651907", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6297745862413278, "ground_truth": 0}, {"key": "37651907", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4282333893927913, "ground_truth": 0}, {"key": "37651907", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5640984966284305, "ground_truth": 0}, {"key": "37651907", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621764883961867, "ground_truth": 0}, {"key": "37651907", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591390152167, "ground_truth": 0}, {"key": "36255476", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7634837632453455, "ground_truth": 0}, {"key": "36255476", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6636689282534031, "ground_truth": 0}, {"key": "36255476", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8175744762634397, "ground_truth": 0}, {"key": "36255476", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884455791636, "ground_truth": 0}, {"key": "36255476", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063843673693, "ground_truth": 0}, {"key": "37283518", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7943849641331296, "ground_truth": 0}, {"key": "37283518", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8344068810505457, "ground_truth": 0}, {"key": "37283518", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8519527822914631, "ground_truth": 0}, {"key": "37283518", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743571747748, "ground_truth": 0}, {"key": "37283518", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423171128284, "ground_truth": 0}, {"key": "34906785", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6095241859699765, "ground_truth": 0}, {"key": "34906785", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7248702851219447, "ground_truth": 0}, {"key": "34906785", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.618780442761213, "ground_truth": 0}, {"key": "34906785", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799928936309937, "ground_truth": 0}, {"key": "34906785", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460137162125826, "ground_truth": 0}, {"key": "34965328", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8221891267296181, "ground_truth": 0}, {"key": "34965328", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8799743698258384, "ground_truth": 0}, {"key": "34965328", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8140527966846209, "ground_truth": 0}, {"key": "34965328", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493361589509, "ground_truth": 0}, {"key": "34965328", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367849881289, "ground_truth": 0}, {"key": "38788440", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.23370636814303314, "ground_truth": 0}, {"key": "38788440", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.21866937796479172, "ground_truth": 0}, {"key": "38788440", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.22270014117183642, "ground_truth": 0}, {"key": "38788440", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.28457598584128546, "ground_truth": 0}, {"key": "38788440", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.37022540725898456, "ground_truth": 0}, {"key": "35046866", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8624675263249901, "ground_truth": 0}, {"key": "35046866", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8278281536603729, "ground_truth": 0}, {"key": "35046866", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8688267720617305, "ground_truth": 0}, {"key": "35046866", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619308047998, "ground_truth": 0}, {"key": "35046866", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8723473653133041, "ground_truth": 0}, {"key": "37629558", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4571367342795657, "ground_truth": 0}, {"key": "37629558", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.43206338644028813, "ground_truth": 0}, {"key": "37629558", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5331543971719057, "ground_truth": 0}, {"key": "37629558", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3830641708228863, "ground_truth": 0}, {"key": "37629558", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3486451307335455, "ground_truth": 0}, {"key": "33859914", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.654894704870378, "ground_truth": 0}, {"key": "33859914", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7634837666759704, "ground_truth": 0}, {"key": "33859914", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8459424454560133, "ground_truth": 0}, {"key": "33859914", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9073122170570785, "ground_truth": 0}, {"key": "33859914", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059389443555, "ground_truth": 0}, {"key": "39790523", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8749346228430727, "ground_truth": 0}, {"key": "39790523", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8289388173132632, "ground_truth": 0}, {"key": "39790523", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8918110456294358, "ground_truth": 0}, {"key": "39790523", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256622294661, "ground_truth": 0}, {"key": "39790523", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8969755723404234, "ground_truth": 0}, {"key": "33509656", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5389832124556184, "ground_truth": 0}, {"key": "33509656", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6757645931689142, "ground_truth": 0}, {"key": "33509656", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4785288423404128, "ground_truth": 0}, {"key": "33509656", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984683274829, "ground_truth": 0}, {"key": "33509656", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882833967770946, "ground_truth": 0}, {"key": "17380923", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7620701038304803, "ground_truth": 0}, {"key": "17380923", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7074047136689523, "ground_truth": 0}, {"key": "17380923", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8128673113617279, "ground_truth": 0}, {"key": "17380923", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894520115196, "ground_truth": 0}, {"key": "17380923", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972727712039, "ground_truth": 0}, {"key": "36202526", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5621764894048783, "ground_truth": 0}, {"key": "36202526", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6513548702811582, "ground_truth": 0}, {"key": "36202526", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3867634471856283, "ground_truth": 0}, {"key": "36202526", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916052854013, "ground_truth": 0}, {"key": "36202526", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583270139305141, "ground_truth": 0}, {"key": "26419232", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6859494442076961, "ground_truth": 0}, {"key": "26419232", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6352224392057569, "ground_truth": 0}, {"key": "26419232", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.57367839688482, "ground_truth": 0}, {"key": "26419232", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47268346214172074, "ground_truth": 0}, {"key": "26419232", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762491883344, "ground_truth": 0}, {"key": "34232398", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6495786063420421, "ground_truth": 0}, {"key": "34232398", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7826624695738595, "ground_truth": 0}, {"key": "34232398", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6242935338371788, "ground_truth": 0}, {"key": "34232398", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512150655947, "ground_truth": 0}, {"key": "34232398", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228321188637, "ground_truth": 0}, {"key": "33586045", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7074046924936043, "ground_truth": 0}, {"key": "33586045", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8539127699568361, "ground_truth": 0}, {"key": "33586045", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6187804203799914, "ground_truth": 0}, {"key": "33586045", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324921100228, "ground_truth": 0}, {"key": "33586045", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583156796492, "ground_truth": 0}, {"key": "32281151", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5907792211932336, "ground_truth": 0}, {"key": "32281151", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45907612526703, "ground_truth": 0}, {"key": "32281151", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.41489886329957537, "ground_truth": 0}, {"key": "32281151", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804407833367, "ground_truth": 0}, {"key": "32281151", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548646660857, "ground_truth": 0}, {"key": "37308159", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9407897465064052, "ground_truth": 0}, {"key": "37308159", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8615382171379191, "ground_truth": 0}, {"key": "37308159", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8832359893784076, "ground_truth": 0}, {"key": "37308159", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.914900950591261, "ground_truth": 0}, {"key": "37308159", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869948346367, "ground_truth": 0}, {"key": "35694408", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7799929131817865, "ground_truth": 0}, {"key": "35694408", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9319595769353262, "ground_truth": 0}, {"key": "35694408", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7994423361804615, "ground_truth": 0}, {"key": "35694408", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281560251414, "ground_truth": 0}, {"key": "35694408", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786997938696, "ground_truth": 0}, {"key": "39781995", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4765796494383268, "ground_truth": 0}, {"key": "39781995", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5813030863080053, "ground_truth": 0}, {"key": "39781995", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4073334004221647, "ground_truth": 0}, {"key": "39781995", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937840377877335, "ground_truth": 0}, {"key": "39781995", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476739030432, "ground_truth": 0}, {"key": "22799372", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9268352780647762, "ground_truth": 0}, {"key": "22799372", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9511422219244764, "ground_truth": 0}, {"key": "22799372", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9429286000905659, "ground_truth": 0}, {"key": "22799372", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9726235095486211, "ground_truth": 0}, {"key": "22799372", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9412234427709462, "ground_truth": 0}, {"key": "37428240", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7505527506815185, "ground_truth": 0}, {"key": "37428240", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4765796513290152, "ground_truth": 0}, {"key": "37428240", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6825737147880531, "ground_truth": 0}, {"key": "37428240", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197656734794, "ground_truth": 0}, {"key": "37428240", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.629774634375965, "ground_truth": 0}, {"key": "40612657", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.966410493711053, "ground_truth": 0}, {"key": "40612657", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9830850887986924, "ground_truth": 0}, {"key": "40612657", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9473810479717873, "ground_truth": 0}, {"key": "40612657", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9618217237043394, "ground_truth": 0}, {"key": "40612657", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9746286906600069, "ground_truth": 0}, {"key": "34404662", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7786493242923577, "ground_truth": 0}, {"key": "34404662", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6477982167085852, "ground_truth": 0}, {"key": "34404662", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.785308563823313, "ground_truth": 0}, {"key": "34404662", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430410916514, "ground_truth": 0}, {"key": "34404662", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943901705331, "ground_truth": 0}, {"key": "32619704", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7490872000155767, "ground_truth": 0}, {"key": "32619704", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7025300445943606, "ground_truth": 0}, {"key": "32619704", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6926419740521438, "ground_truth": 0}, {"key": "32619704", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689437298787, "ground_truth": 0}, {"key": "32619704", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059568872106, "ground_truth": 0}, {"key": "39014883", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5736784072157372, "ground_truth": 0}, {"key": "39014883", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6566582716365432, "ground_truth": 0}, {"key": "39014883", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5660184981049843, "ground_truth": 0}, {"key": "39014883", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702646637871, "ground_truth": 0}, {"key": "39014883", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891301084079, "ground_truth": 0}, {"key": "37982812", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8596637481735105, "ground_truth": 0}, {"key": "37982812", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8509647017136229, "ground_truth": 0}, {"key": "37982812", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9167080707836218, "ground_truth": 0}, {"key": "37982812", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240866090259, "ground_truth": 0}, {"key": "37982812", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9130583414715132, "ground_truth": 0}, {"key": "28123476", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8856314759798912, "ground_truth": 0}, {"key": "28123476", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.824461928514344, "ground_truth": 0}, {"key": "28123476", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7799929025192942, "ground_truth": 0}, {"key": "28123476", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867696376784, "ground_truth": 0}, {"key": "28123476", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152325044857722, "ground_truth": 0}, {"key": "39078849", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6001883666065827, "ground_truth": 0}, {"key": "39078849", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238688192706, "ground_truth": 0}, {"key": "39078849", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7718434869072364, "ground_truth": 0}, {"key": "39078849", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241560452238, "ground_truth": 0}, {"key": "39078849", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046825150406, "ground_truth": 0}, {"key": "39414137", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9651191135959196, "ground_truth": 0}, {"key": "39414137", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9465966750000557, "ground_truth": 0}, {"key": "39414137", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9433475687695688, "ground_truth": 0}, {"key": "39414137", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.945801274803701, "ground_truth": 0}, {"key": "39414137", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9609517057295763, "ground_truth": 0}, {"key": "37371354", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5888891103079638, "ground_truth": 0}, {"key": "37371354", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6442250964986901, "ground_truth": 0}, {"key": "37371354", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.41111085775583756, "ground_truth": 0}, {"key": "37371354", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640243247886, "ground_truth": 0}, {"key": "37371354", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282333780038398, "ground_truth": 0}, {"key": "29497179", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8887588012066938, "ground_truth": 0}, {"key": "29497179", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7648916184197728, "ground_truth": 0}, {"key": "29497179", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9099069941596215, "ground_truth": 0}, {"key": "29497179", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933783369397, "ground_truth": 0}, {"key": "29497179", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110512433324, "ground_truth": 0}, {"key": "35908694", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9092645092334329, "ground_truth": 0}, {"key": "35908694", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9543079684927379, "ground_truth": 0}, {"key": "35908694", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8902942179703823, "ground_truth": 0}, {"key": "35908694", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675320640881, "ground_truth": 0}, {"key": "35908694", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9155072460803811, "ground_truth": 0}, {"key": "37619358", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7201715063553512, "ground_truth": 0}, {"key": "37619358", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8031737984538974, "ground_truth": 0}, {"key": "37619358", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6406358709777374, "ground_truth": 0}, {"key": "37619358", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299701585972, "ground_truth": 0}, {"key": "37619358", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.46879063571381124, "ground_truth": 0}, {"key": "37293103", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8175744775887127, "ground_truth": 0}, {"key": "37293103", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7106282844533408, "ground_truth": 0}, {"key": "37293103", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.889528845819249, "ground_truth": 0}, {"key": "37293103", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343730710409, "ground_truth": 0}, {"key": "37293103", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357623619731, "ground_truth": 0}, {"key": "36883729", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4902356298234713, "ground_truth": 0}, {"key": "36883729", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5428632739226839, "ground_truth": 0}, {"key": "36883729", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42441196916750124, "ground_truth": 0}, {"key": "36883729", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786968069083, "ground_truth": 0}, {"key": "36883729", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33633104399794855, "ground_truth": 0}, {"key": "39209521", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7905303385587793, "ground_truth": 0}, {"key": "39209521", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.661922863561188, "ground_truth": 0}, {"key": "39209521", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7853085709826312, "ground_truth": 0}, {"key": "39209521", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149595248484, "ground_truth": 0}, {"key": "39209521", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148322497361, "ground_truth": 0}, {"key": "27792571", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7401743841768248, "ground_truth": 0}, {"key": "27792571", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7718435015867452, "ground_truth": 0}, {"key": "27792571", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5717666132413146, "ground_truth": 0}, {"key": "27792571", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032942012002615, "ground_truth": 0}, {"key": "27792571", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.824461903925557, "ground_truth": 0}, {"key": "39755647", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7217432265079009, "ground_truth": 0}, {"key": "39755647", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7520125828342872, "ground_truth": 0}, {"key": "39755647", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7008948215407643, "ground_truth": 0}, {"key": "39755647", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743689561028, "ground_truth": 0}, {"key": "39755647", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740443113393, "ground_truth": 0}, {"key": "40800537", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.10970577536019158, "ground_truth": 0}, {"key": "40800537", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41489885013628236, "ground_truth": 0}, {"key": "40800537", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1766715807856765, "ground_truth": 0}, {"key": "40800537", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.28616924463511206, "ground_truth": 0}, {"key": "40800537", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.35042136032295285, "ground_truth": 0}, {"key": "14171461", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6150878815023595, "ground_truth": 0}, {"key": "14171461", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6654105806514122, "ground_truth": 0}, {"key": "14171461", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6876299892102086, "ground_truth": 0}, {"key": "14171461", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718435003923746, "ground_truth": 0}, {"key": "14171461", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833956707111, "ground_truth": 0}, {"key": "36892440", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3208212906302276, "ground_truth": 0}, {"key": "36892440", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2766905103718321, "ground_truth": 0}, {"key": "36892440", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5467381262507205, "ground_truth": 0}, {"key": "36892440", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.644225100316, "ground_truth": 0}, {"key": "36892440", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282334033902824, "ground_truth": 0}, {"key": "33733410", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8529354805310586, "ground_truth": 0}, {"key": "33733410", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6926419882197722, "ground_truth": 0}, {"key": "33733410", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7170118793179736, "ground_truth": 0}, {"key": "33733410", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195301105544, "ground_truth": 0}, {"key": "33733410", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210624305093, "ground_truth": 0}, {"key": "38587765", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.1571368493484776, "ground_truth": 0}, {"key": "38587765", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1732882062776068, "ground_truth": 0}, {"key": "38587765", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6242935459459465, "ground_truth": 0}, {"key": "38587765", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.18713269329725069, "ground_truth": 0}, {"key": "38587765", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808591635256, "ground_truth": 0}, {"key": "41065582", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.40168784245635836, "ground_truth": 0}, {"key": "41065582", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1460872493487828, "ground_truth": 0}, {"key": "41065582", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4785288530487944, "ground_truth": 0}, {"key": "41065582", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4551985914372505, "ground_truth": 0}, {"key": "41065582", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.46101675424972205, "ground_truth": 0}, {"key": "34713891", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.09534946632958384, "ground_truth": 0}, {"key": "34713891", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22270013810099296, "ground_truth": 0}, {"key": "34713891", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46490155478802375, "ground_truth": 0}, {"key": "34713891", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3259495266215209, "ground_truth": 0}, {"key": "34713891", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135069233470223, "ground_truth": 0}, {"key": "18913023", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8940517187434902, "ground_truth": 0}, {"key": "18913023", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9268352824052214, "ground_truth": 0}, {"key": "18913023", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9449947168668935, "ground_truth": 0}, {"key": "18913023", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.837619974314004, "ground_truth": 0}, {"key": "18913023", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9268352809169962, "ground_truth": 0}, {"key": "36884100", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.33807711761274034, "ground_truth": 0}, {"key": "36884100", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4571367200859188, "ground_truth": 0}, {"key": "36884100", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.13477592137518632, "ground_truth": 0}, {"key": "36884100", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33111973973072434, "ground_truth": 0}, {"key": "36884100", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.13386748653456637, "ground_truth": 0}, {"key": "39899913", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8679338367524851, "ground_truth": 0}, {"key": "39899913", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7416740194864807, "ground_truth": 0}, {"key": "39899913", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8832359869830952, "ground_truth": 0}, {"key": "39899913", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970847823396, "ground_truth": 0}, {"key": "39899913", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637462162562, "ground_truth": 0}, {"key": "30725366", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.021450730780767934, "ground_truth": 0}, {"key": "30725366", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.17895590102561676, "ground_truth": 0}, {"key": "30725366", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.05184546991155868, "ground_truth": 0}, {"key": "30725366", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.05340332970934304, "ground_truth": 0}, {"key": "30725366", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.059210253667324804, "ground_truth": 0}, {"key": "26133523", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5602526511150775, "ground_truth": 0}, {"key": "26133523", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45713671678304724, "ground_truth": 0}, {"key": "26133523", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6531269140801003, "ground_truth": 0}, {"key": "26133523", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011555612335, "ground_truth": 0}, {"key": "26133523", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089094763324, "ground_truth": 0}, {"key": "29332665", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7534666546252066, "ground_truth": 0}, {"key": "29332665", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8558511531405453, "ground_truth": 0}, {"key": "29332665", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7772998758968566, "ground_truth": 0}, {"key": "29332665", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593265614737, "ground_truth": 0}, {"key": "29332665", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744785684416, "ground_truth": 0}, {"key": "37400481", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7853085926734199, "ground_truth": 0}, {"key": "37400481", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9284088052170639, "ground_truth": 0}, {"key": "37400481", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9263037320085319, "ground_truth": 0}, {"key": "37400481", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894568420084, "ground_truth": 0}, {"key": "37400481", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.875786991429717, "ground_truth": 0}, {"key": "38787241", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5253688549885672, "ground_truth": 0}, {"key": "38787241", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4378234878406342, "ground_truth": 0}, {"key": "38787241", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6424324449064436, "ground_truth": 0}, {"key": "38787241", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740324122323, "ground_truth": 0}, {"key": "38787241", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633732037696, "ground_truth": 0}, {"key": "38225963", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5428632717577755, "ground_truth": 0}, {"key": "38225963", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8221891308235747, "ground_truth": 0}, {"key": "38225963", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7154240111830639, "ground_truth": 0}, {"key": "38225963", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933486021667, "ground_truth": 0}, {"key": "38225963", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269345448889, "ground_truth": 0}, {"key": "26072034", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.16026603469490258, "ground_truth": 0}, {"key": "26072034", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1320661513932486, "ground_truth": 0}, {"key": "26072034", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.24653333858609142, "ground_truth": 0}, {"key": "26072034", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.14804719116831988, "ground_truth": 0}, {"key": "26072034", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.12678516978485202, "ground_truth": 0}, {"key": "35690810", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7201715034275923, "ground_truth": 0}, {"key": "35690810", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8267117954873094, "ground_truth": 0}, {"key": "35690810", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9219218408285194, "ground_truth": 0}, {"key": "35690810", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339691576364, "ground_truth": 0}, {"key": "35690810", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366610310199, "ground_truth": 0}, {"key": "36855665", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9874720675731323, "ground_truth": 0}, {"key": "36855665", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.984093608426523, "ground_truth": 0}, {"key": "36855665", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9522199323322044, "ground_truth": 0}, {"key": "36855665", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.916708089497197, "ground_truth": 0}, {"key": "36855665", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9294404095918538, "ground_truth": 0}, {"key": "29757662", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.46101678497060483, "ground_truth": 0}, {"key": "29757662", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5964331594810924, "ground_truth": 0}, {"key": "29757662", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6095241791993368, "ground_truth": 0}, {"key": "29757662", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.46295860672483496, "ground_truth": 0}, {"key": "29757662", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061679149154, "ground_truth": 0}, {"key": "19134339", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7549149886122425, "ground_truth": 0}, {"key": "19134339", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.58510116613968, "ground_truth": 0}, {"key": "19134339", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6859494652821113, "ground_truth": 0}, {"key": "19134339", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336918399363, "ground_truth": 0}, {"key": "19134339", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494445236669, "ground_truth": 0}, {"key": "35360732", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9118099611834879, "ground_truth": 0}, {"key": "35360732", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8376199690171937, "ground_truth": 0}, {"key": "35360732", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9053223048225509, "ground_truth": 0}, {"key": "35360732", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549534672358, "ground_truth": 0}, {"key": "35360732", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366584901979, "ground_truth": 0}, {"key": "37713629", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4707366285779368, "ground_truth": 0}, {"key": "37713629", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.642432466518375, "ground_truth": 0}, {"key": "37713629", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.47268347623478696, "ground_truth": 0}, {"key": "37713629", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4551986073686939, "ground_truth": 0}, {"key": "37713629", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473268479565, "ground_truth": 0}, {"key": "33393394", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7606506615078649, "ground_truth": 0}, {"key": "33393394", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7057850026416913, "ground_truth": 0}, {"key": "33393394", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6566582921991967, "ground_truth": 0}, {"key": "33393394", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448014184427917, "ground_truth": 0}, {"key": "33393394", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324685655581, "ground_truth": 0}, {"key": "32275837", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8872045913251878, "ground_truth": 0}, {"key": "32275837", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9348724523064208, "ground_truth": 0}, {"key": "32275837", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9343951591685972, "ground_truth": 0}, {"key": "32275837", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434928963636, "ground_truth": 0}, {"key": "32275837", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919929083058, "ground_truth": 0}, {"key": "21458094", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5486735004985495, "ground_truth": 0}, {"key": "21458094", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.35220180344505525, "ground_truth": 0}, {"key": "21458094", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5409238715159246, "ground_truth": 0}, {"key": "21458094", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740240893404, "ground_truth": 0}, {"key": "21458094", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317045263213, "ground_truth": 0}, {"key": "40975362", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6992544084839504, "ground_truth": 0}, {"key": "40975362", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7008948164221119, "ground_truth": 0}, {"key": "40975362", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.851952812888262, "ground_truth": 0}, {"key": "40975362", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159559744598, "ground_truth": 0}, {"key": "40975362", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.815232492710537, "ground_truth": 0}, {"key": "35234201", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7839884562996992, "ground_truth": 0}, {"key": "35234201", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6909762934132214, "ground_truth": 0}, {"key": "35234201", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6352224420064245, "ground_truth": 0}, {"key": "35234201", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318033591405, "ground_truth": 0}, {"key": "35234201", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397404218882, "ground_truth": 0}, {"key": "36037573", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8529354784042931, "ground_truth": 0}, {"key": "36037573", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8509647113591575, "ground_truth": 0}, {"key": "36037573", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7786493027788443, "ground_truth": 0}, {"key": "36037573", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333246042160045, "ground_truth": 0}, {"key": "36037573", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.81873678015661, "ground_truth": 0}, {"key": "30861915", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8624675250390631, "ground_truth": 0}, {"key": "30861915", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8140527923626873, "ground_truth": 0}, {"key": "30861915", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8799743788844505, "ground_truth": 0}, {"key": "30861915", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359869348468, "ground_truth": 0}, {"key": "30861915", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467676174372, "ground_truth": 0}, {"key": "40173012", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5370413476342776, "ground_truth": 0}, {"key": "40173012", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2909808569590362, "ground_truth": 0}, {"key": "40173012", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2553436746169757, "ground_truth": 0}, {"key": "40173012", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.24220561785881656, "ground_truth": 0}, {"key": "40173012", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.27202454678632904, "ground_truth": 0}, {"key": "35100330", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5774953994683916, "ground_truth": 0}, {"key": "35100330", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5428632757292596, "ground_truth": 0}, {"key": "35100330", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3793783866470372, "ground_truth": 0}, {"key": "35100330", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832122697713, "ground_truth": 0}, {"key": "35100330", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974734921611, "ground_truth": 0}, {"key": "37220221", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9155072510921276, "ground_truth": 0}, {"key": "37220221", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9372107917916147, "ground_truth": 0}, {"key": "37220221", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8757869829883457, "ground_truth": 0}, {"key": "37220221", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278673733138, "ground_truth": 0}, {"key": "37220221", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9403530555266054, "ground_truth": 0}, {"key": "38815218", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9026096035346631, "ground_truth": 0}, {"key": "38815218", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8925625201906873, "ground_truth": 0}, {"key": "38815218", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7918210733723767, "ground_truth": 0}, {"key": "38815218", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.909264509721023, "ground_truth": 0}, {"key": "38815218", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9618217279429068, "ground_truth": 0}, {"key": "39379109", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5331544095042897, "ground_truth": 0}, {"key": "39379109", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2583259713568003, "ground_truth": 0}, {"key": "39379109", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2704802161456019, "ground_truth": 0}, {"key": "39379109", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269726097333, "ground_truth": 0}, {"key": "39379109", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33111973304251435, "ground_truth": 0}, {"key": "14576125", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.13846179223241856, "ground_truth": 0}, {"key": "14576125", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.13206616534419452, "ground_truth": 0}, {"key": "14576125", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.0660853785927374, "ground_truth": 0}, {"key": "14576125", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.12592277106431995, "ground_truth": 0}, {"key": "14576125", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.07004895950241324, "ground_truth": 0}, {"key": "40814250", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9155072515624723, "ground_truth": 0}, {"key": "40814250", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8428631311728286, "ground_truth": 0}, {"key": "40814250", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8840392855150673, "ground_truth": 0}, {"key": "40814250", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9329437126951039, "ground_truth": 0}, {"key": "40814250", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.884039284196965, "ground_truth": 0}, {"key": "36334488", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.39420093434568504, "ground_truth": 0}, {"key": "36334488", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2323101379312986, "ground_truth": 0}, {"key": "36334488", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.37937837694005466, "ground_truth": 0}, {"key": "36334488", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557748908501961, "ground_truth": 0}, {"key": "36334488", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4726834742012467, "ground_truth": 0}, {"key": "36888322", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6791786914799822, "ground_truth": 0}, {"key": "36888322", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3575675127410549, "ground_truth": 0}, {"key": "36888322", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42823337573364356, "ground_truth": 0}, {"key": "36888322", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.554470478441528, "ground_truth": 0}, {"key": "36888322", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591286950833, "ground_truth": 0}, {"key": "37318916", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9314625097801168, "ground_truth": 0}, {"key": "37318916", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.936284998731502, "ground_truth": 0}, {"key": "37318916", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.936749475160612, "ground_truth": 0}, {"key": "37318916", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519527988222, "ground_truth": 0}, {"key": "37318916", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.913058342487361, "ground_truth": 0}, {"key": "39308700", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.29746992978086356, "ground_truth": 0}, {"key": "39308700", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5350984177323924, "ground_truth": 0}, {"key": "39308700", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5563995698439104, "ground_truth": 0}, {"key": "39308700", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.28298811386660705, "ground_truth": 0}, {"key": "39308700", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.278256799871242, "ground_truth": 0}, {"key": "31061543", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6584174885422075, "ground_truth": 0}, {"key": "31061543", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8344068901630957, "ground_truth": 0}, {"key": "31061543", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6926419956969272, "ground_truth": 0}, {"key": "31061543", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9155072466476519, "ground_truth": 0}, {"key": "31061543", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867775690161, "ground_truth": 0}, {"key": "37380894", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7025300484471271, "ground_truth": 0}, {"key": "37380894", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8998277723839728, "ground_truth": 0}, {"key": "37380894", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.868826781269611, "ground_truth": 0}, {"key": "37380894", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837585879248, "ground_truth": 0}, {"key": "37380894", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382097730399, "ground_truth": 0}, {"key": "38410139", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.40922077854679256, "ground_truth": 0}, {"key": "38410139", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3665897448311154, "ground_truth": 0}, {"key": "38410139", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.680878593617589, "ground_truth": 0}, {"key": "38410139", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891238801123, "ground_truth": 0}, {"key": "38410139", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998459103199, "ground_truth": 0}, {"key": "35953842", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.687629978119212, "ground_truth": 0}, {"key": "35953842", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7969253893783335, "ground_truth": 0}, {"key": "35953842", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7341195388644746, "ground_truth": 0}, {"key": "35953842", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666732252778, "ground_truth": 0}, {"key": "35953842", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647888663325, "ground_truth": 0}, {"key": "39815663", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2909808520404419, "ground_truth": 0}, {"key": "39815663", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.0726367080458683, "ground_truth": 0}, {"key": "39815663", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1441488498218707, "ground_truth": 0}, {"key": "39815663", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.07004896634157325, "ground_truth": 0}, {"key": "39815663", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.21733752209774865, "ground_truth": 0}, {"key": "35121432", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9343951626897018, "ground_truth": 0}, {"key": "35121432", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9079671370742404, "ground_truth": 0}, {"key": "35121432", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.867035765364353, "ground_truth": 0}, {"key": "35121432", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489721936709387, "ground_truth": 0}, {"key": "35121432", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382173936827, "ground_truth": 0}, {"key": "21712310", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.25683200593923666, "ground_truth": 0}, {"key": "21712310", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.47268345230203324, "ground_truth": 0}, {"key": "21712310", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3557748809788445, "ground_truth": 0}, {"key": "21712310", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4186968951637967, "ground_truth": 0}, {"key": "21712310", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4746311872203513, "ground_truth": 0}, {"key": "37952914", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8723473808321293, "ground_truth": 0}, {"key": "37952914", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.789233696504231, "ground_truth": 0}, {"key": "37952914", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8596637441660987, "ground_truth": 0}, {"key": "37952914", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666387743162, "ground_truth": 0}, {"key": "37952914", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437635191213, "ground_truth": 0}, {"key": "38956779", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6774740208630481, "ground_truth": 0}, {"key": "38956779", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.36658975783230385, "ground_truth": 0}, {"key": "38956779", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.41679662732435463, "ground_truth": 0}, {"key": "38956779", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.39233684411753605, "ground_truth": 0}, {"key": "38956779", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3684056933116001, "ground_truth": 0}, {"key": "36101833", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.62795121246975, "ground_truth": 0}, {"key": "36101833", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5467381723945283, "ground_truth": 0}, {"key": "36101833", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7563575700431167, "ground_truth": 0}, {"key": "36101833", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786954236562, "ground_truth": 0}, {"key": "36101833", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121665301139, "ground_truth": 0}, {"key": "35544662", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6636689629028832, "ground_truth": 0}, {"key": "35544662", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37022541669966635, "ground_truth": 0}, {"key": "35544662", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8044059206588868, "ground_truth": 0}, {"key": "35544662", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388088745764, "ground_truth": 0}, {"key": "35544662", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872289976503, "ground_truth": 0}, {"key": "39759044", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3468730949517381, "ground_truth": 0}, {"key": "39759044", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3023910884406539, "ground_truth": 0}, {"key": "39759044", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.36477758011437655, "ground_truth": 0}, {"key": "39759044", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.28298811453887557, "ground_truth": 0}, {"key": "39759044", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.22270014475678823, "ground_truth": 0}, {"key": "39433018", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.920217986339338, "ground_truth": 0}, {"key": "39433018", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9124361617875645, "ground_truth": 0}, {"key": "39433018", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8428631506190503, "ground_truth": 0}, {"key": "39433018", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9073122192350133, "ground_truth": 0}, {"key": "39433018", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036193223443, "ground_truth": 0}, {"key": "22111959", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4863315195164977, "ground_truth": 0}, {"key": "22111959", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.476579659771756, "ground_truth": 0}, {"key": "22111959", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5292633815346491, "ground_truth": 0}, {"key": "22111959", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591061133405, "ground_truth": 0}, {"key": "22111959", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715157672126, "ground_truth": 0}, {"key": "38210094", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5117165900973107, "ground_truth": 0}, {"key": "38210094", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3904758178635347, "ground_truth": 0}, {"key": "38210094", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6169358339591517, "ground_truth": 0}, {"key": "38210094", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262572099265, "ground_truth": 0}, {"key": "38210094", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213306865378, "ground_truth": 0}, {"key": "37675935", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3415825031219073, "ground_truth": 0}, {"key": "37675935", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41489883068917305, "ground_truth": 0}, {"key": "37675935", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4610167786866434, "ground_truth": 0}, {"key": "37675935", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591335385909, "ground_truth": 0}, {"key": "37675935", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.38306414983747455, "ground_truth": 0}, {"key": "35732604", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2974699560344537, "ground_truth": 0}, {"key": "35732604", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3757064764379062, "ground_truth": 0}, {"key": "35732604", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.0960254947269443, "ground_truth": 0}, {"key": "35732604", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.28140562340642455, "ground_truth": 0}, {"key": "35732604", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.15713685792863796, "ground_truth": 0}, {"key": "27453212", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6825737491038258, "ground_truth": 0}, {"key": "27453212", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6370307993472959, "ground_truth": 0}, {"key": "27453212", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7634837595026278, "ground_truth": 0}, {"key": "27453212", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942896376389, "ground_truth": 0}, {"key": "27453212", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233284077790981, "ground_truth": 0}, {"key": "39910047", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5888891469764583, "ground_truth": 0}, {"key": "39910047", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6150878434332566, "ground_truth": 0}, {"key": "39910047", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5869964311554695, "ground_truth": 0}, {"key": "39910047", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.58130307103265, "ground_truth": 0}, {"key": "39910047", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802504470491, "ground_truth": 0}, {"key": "40054265", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6548947195614774, "ground_truth": 0}, {"key": "40054265", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4960938392035059, "ground_truth": 0}, {"key": "40054265", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4629586181243648, "ground_truth": 0}, {"key": "40054265", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.46684560558964594, "ground_truth": 0}, {"key": "40054265", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.40356686431859534, "ground_truth": 0}, {"key": "19984615", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4130035666110496, "ground_truth": 0}, {"key": "19984615", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6132365260185331, "ground_truth": 0}, {"key": "19984615", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.44939264437003584, "ground_truth": 0}, {"key": "19984615", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.41679664295186, "ground_truth": 0}, {"key": "19984615", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1470645248933995, "ground_truth": 0}, {"key": "16490806", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4436004131009491, "ground_truth": 0}, {"key": "16490806", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.527316528508648, "ground_truth": 0}, {"key": "16490806", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3923368073450471, "ground_truth": 0}, {"key": "16490806", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.28937169907596166, "ground_truth": 0}, {"key": "16490806", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.47073658866181506, "ground_truth": 0}, {"key": "36396237", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9618217265341619, "ground_truth": 0}, {"key": "36396237", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9637799457509324, "ground_truth": 0}, {"key": "36396237", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9640516797433172, "ground_truth": 0}, {"key": "36396237", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9433475760683484, "ground_truth": 0}, {"key": "36396237", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9246876974703294, "ground_truth": 0}, {"key": "40726444", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4921881383280728, "ground_truth": 0}, {"key": "40726444", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48633153900485443, "ground_truth": 0}, {"key": "40726444", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.509764401001618, "ground_truth": 0}, {"key": "40726444", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526501357608, "ground_truth": 0}, {"key": "40726444", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526563864469, "ground_truth": 0}, {"key": "37314826", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2628418503240232, "ground_truth": 0}, {"key": "37314826", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.17328821422903695, "ground_truth": 0}, {"key": "37314826", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4282334094076309, "ground_truth": 0}, {"key": "37314826", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4765796486313837, "ground_truth": 0}, {"key": "37314826", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3867634763522174, "ground_truth": 0}, {"key": "38506971", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4282334095404487, "ground_truth": 0}, {"key": "38506971", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5350984339296204, "ground_truth": 0}, {"key": "38506971", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6424324895708167, "ground_truth": 0}, {"key": "38506971", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.32082128643969804, "ground_truth": 0}, {"key": "38506971", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.19436779243068963, "ground_truth": 0}, {"key": "40699312", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7620701143822448, "ground_truth": 0}, {"key": "40699312", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9334308108760636, "ground_truth": 0}, {"key": "40699312", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8740772288114064, "ground_truth": 0}, {"key": "40699312", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920226162995, "ground_truth": 0}, {"key": "40699312", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802822434576, "ground_truth": 0}, {"key": "34695474", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7341195584471768, "ground_truth": 0}, {"key": "34695474", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5945512464740719, "ground_truth": 0}, {"key": "34695474", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7217432100328358, "ground_truth": 0}, {"key": "34695474", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813031035226139, "ground_truth": 0}, {"key": "34695474", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.658417504248862, "ground_truth": 0}, {"key": "36281498", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8679338360154065, "ground_truth": 0}, {"key": "36281498", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8322366499557357, "ground_truth": 0}, {"key": "36281498", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7994423082494809, "ground_truth": 0}, {"key": "36281498", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264255937793234, "ground_truth": 0}, {"key": "36281498", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321855238103, "ground_truth": 0}, {"key": "39558652", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3433417204922797, "ground_truth": 0}, {"key": "39558652", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.43782350538728076, "ground_truth": 0}, {"key": "39558652", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6706082770607443, "ground_truth": 0}, {"key": "39558652", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254023114944, "ground_truth": 0}, {"key": "39558652", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.689305641594213, "ground_truth": 0}, {"key": "37330579", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4397473557967899, "ground_truth": 0}, {"key": "37330579", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.23231014137110415, "ground_truth": 0}, {"key": "37330579", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.27357439971875513, "ground_truth": 0}, {"key": "37330579", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.35398630833295097, "ground_truth": 0}, {"key": "37330579", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.41300354651443605, "ground_truth": 0}, {"key": "40547658", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5467381328916968, "ground_truth": 0}, {"key": "40547658", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.638835274935215, "ground_truth": 0}, {"key": "40547658", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5774953634248475, "ground_truth": 0}, {"key": "40547658", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.734119509806549, "ground_truth": 0}, {"key": "40547658", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307655370175, "ground_truth": 0}, {"key": "37119340", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3979384005673774, "ground_truth": 0}, {"key": "37119340", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.43014735120587627, "ground_truth": 0}, {"key": "37119340", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4882833833053754, "ground_truth": 0}, {"key": "37119340", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476666905067, "ground_truth": 0}, {"key": "37119340", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3923368063582311, "ground_truth": 0}, {"key": "35301627", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5136684688295775, "ground_truth": 0}, {"key": "35301627", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.33633106195156737, "ground_truth": 0}, {"key": "35301627", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6206215994647004, "ground_truth": 0}, {"key": "35301627", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307597369443, "ground_truth": 0}, {"key": "35301627", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909763171808286, "ground_truth": 0}, {"key": "34037168", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.29259529165546655, "ground_truth": 0}, {"key": "34037168", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3023910896056184, "ground_truth": 0}, {"key": "34037168", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.29583987951355034, "ground_truth": 0}, {"key": "34037168", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3123700051814956, "ground_truth": 0}, {"key": "34037168", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.39606817683486, "ground_truth": 0}, {"key": "39703862", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9224823395488841, "ground_truth": 0}, {"key": "39703862", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9319595767653175, "ground_truth": 0}, {"key": "39703862", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9184802475251473, "ground_truth": 0}, {"key": "39703862", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9213576154139168, "ground_truth": 0}, {"key": "39703862", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372107869813836, "ground_truth": 0}, {"key": "16554814", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6370307782459118, "ground_truth": 0}, {"key": "16554814", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.656658276597114, "ground_truth": 0}, {"key": "16554814", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7310585921052409, "ground_truth": 0}, {"key": "16554814", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943790994498, "ground_truth": 0}, {"key": "16554814", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689531717088, "ground_truth": 0}, {"key": "32983099", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.13660839721195858, "ground_truth": 0}, {"key": "32983099", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.08945459934293774, "ground_truth": 0}, {"key": "32983099", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2309197603323016, "ground_truth": 0}, {"key": "32983099", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4455295436701189, "ground_truth": 0}, {"key": "32983099", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.31573596780314345, "ground_truth": 0}, {"key": "41072994", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3923368410224353, "ground_truth": 0}, {"key": "41072994", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.47657965689186477, "ground_truth": 0}, {"key": "41072994", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2436424318856777, "ground_truth": 0}, {"key": "41072994", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.38121955322737316, "ground_truth": 0}, {"key": "41072994", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.26133092423816245, "ground_truth": 0}, {"key": "38396247", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.865224098279274, "ground_truth": 0}, {"key": "38396247", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8740772273984004, "ground_truth": 0}, {"key": "38396247", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9073122200015001, "ground_truth": 0}, {"key": "38396247", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281644528002, "ground_truth": 0}, {"key": "38396247", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9640516749740915, "ground_truth": 0}, {"key": "37507998", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6619228724080234, "ground_truth": 0}, {"key": "37507998", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5813031007756089, "ground_truth": 0}, {"key": "37507998", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8449215356729138, "ground_truth": 0}, {"key": "37507998", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073958711011, "ground_truth": 0}, {"key": "37507998", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118811926988, "ground_truth": 0}, {"key": "32593929", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.37204876123210223, "ground_truth": 0}, {"key": "32593929", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5717665941445543, "ground_truth": 0}, {"key": "32593929", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.36477755891060165, "ground_truth": 0}, {"key": "32593929", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216483423619, "ground_truth": 0}, {"key": "32593929", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593411417293, "ground_truth": 0}, {"key": "36056449", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.519521321005014, "ground_truth": 0}, {"key": "36056449", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7341195502056942, "ground_truth": 0}, {"key": "36056449", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7931059328640235, "ground_truth": 0}, {"key": "36056449", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804230266759, "ground_truth": 0}, {"key": "36056449", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526500949822, "ground_truth": 0}, {"key": "21986185", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.1294027252823272, "ground_truth": 0}, {"key": "21986185", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1895210844563947, "ground_truth": 0}, {"key": "21986185", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.18594720251566904, "ground_truth": 0}, {"key": "21986185", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048023127074095, "ground_truth": 0}, {"key": "21986185", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1666754023587463, "ground_truth": 0}, {"key": "40757465", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6297745931058666, "ground_truth": 0}, {"key": "40757465", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5078118819221339, "ground_truth": 0}, {"key": "40757465", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5292633860289666, "ground_truth": 0}, {"key": "40757465", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.540923867222291, "ground_truth": 0}, {"key": "40757465", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852883931598117, "ground_truth": 0}, {"key": "35198313", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.45132651314705613, "ground_truth": 0}, {"key": "35198313", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4493926189458054, "ground_truth": 0}, {"key": "35198313", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5945512689432073, "ground_truth": 0}, {"key": "35198313", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3942009375086809, "ground_truth": 0}, {"key": "35198313", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224457459922, "ground_truth": 0}, {"key": "30604618", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7201715139520941, "ground_truth": 0}, {"key": "30604618", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6352224406166076, "ground_truth": 0}, {"key": "30604618", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.839733970031373, "ground_truth": 0}, {"key": "30604618", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251175741446, "ground_truth": 0}, {"key": "30604618", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.660172402130251, "ground_truth": 0}, {"key": "35779006", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5736784120535782, "ground_truth": 0}, {"key": "35779006", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4765796598222728, "ground_truth": 0}, {"key": "35779006", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46879062867619664, "ground_truth": 0}, {"key": "35779006", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531642752301, "ground_truth": 0}, {"key": "35779006", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640066333082, "ground_truth": 0}, {"key": "33858956", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5175708821228159, "ground_truth": 0}, {"key": "33858956", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.47852883905262955, "ground_truth": 0}, {"key": "33858956", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7634837686320074, "ground_truth": 0}, {"key": "33858956", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982496451121, "ground_truth": 0}, {"key": "33858956", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757645700854256, "ground_truth": 0}, {"key": "38633880", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.35577490496334496, "ground_truth": 0}, {"key": "38633880", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2030746269934538, "ground_truth": 0}, {"key": "38633880", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.18713268389134527, "ground_truth": 0}, {"key": "38633880", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2991052013911871, "ground_truth": 0}, {"key": "38633880", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982760695951875, "ground_truth": 0}, {"key": "36654905", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9832145120506103, "ground_truth": 0}, {"key": "36654905", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9912886153464666, "ground_truth": 0}, {"key": "36654905", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9763105265408623, "ground_truth": 0}, {"key": "36654905", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9465966686623956, "ground_truth": 0}, {"key": "36654905", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.957912270176493, "ground_truth": 0}, {"key": "26547482", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3979384464160314, "ground_truth": 0}, {"key": "26547482", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.20434190859577822, "ground_truth": 0}, {"key": "26547482", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.40733340390620865, "ground_truth": 0}, {"key": "26547482", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4205995836780233, "ground_truth": 0}, {"key": "26547482", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.37022537089155183, "ground_truth": 0}, {"key": "36439068", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7201715217974579, "ground_truth": 0}, {"key": "36439068", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5136684518775402, "ground_truth": 0}, {"key": "36439068", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.40733340785681743, "ground_truth": 0}, {"key": "36439068", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4016877906158616, "ground_truth": 0}, {"key": "36439068", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4339814571516839, "ground_truth": 0}, {"key": "30501258", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5660185035010192, "ground_truth": 0}, {"key": "30501258", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8354835372760696, "ground_truth": 0}, {"key": "30501258", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5926665946276053, "ground_truth": 0}, {"key": "30501258", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891505993652, "ground_truth": 0}, {"key": "30501258", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.718594401230098, "ground_truth": 0}, {"key": "37560941", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.640635865858763, "ground_truth": 0}, {"key": "37560941", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8267117900512168, "ground_truth": 0}, {"key": "37560941", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46684559359824707, "ground_truth": 0}, {"key": "37560941", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587992404015, "ground_truth": 0}, {"key": "37560941", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306273034663, "ground_truth": 0}, {"key": "36801665", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8164063937930937, "ground_truth": 0}, {"key": "36801665", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8714748581802896, "ground_truth": 0}, {"key": "36801665", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7279754183404125, "ground_truth": 0}, {"key": "36801665", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032942179246333, "ground_truth": 0}, {"key": "36801665", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.824461909338923, "ground_truth": 0}, {"key": "34954610", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3504213662105923, "ground_truth": 0}, {"key": "34954610", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3090236994504023, "ground_truth": 0}, {"key": "34954610", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.35042137966317405, "ground_truth": 0}, {"key": "34954610", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4244119838006803, "ground_truth": 0}, {"key": "34954610", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413641839098, "ground_truth": 0}, {"key": "37020510", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7799929033972158, "ground_truth": 0}, {"key": "37020510", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6859494381353481, "ground_truth": 0}, {"key": "37020510", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6187804119966842, "ground_truth": 0}, {"key": "37020510", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367918646544, "ground_truth": 0}, {"key": "37020510", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303162160227, "ground_truth": 0}, {"key": "38064637", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.19072401651303522, "ground_truth": 0}, {"key": "38064637", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.12940272977738226, "ground_truth": 0}, {"key": "38064637", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.20946968269437694, "ground_truth": 0}, {"key": "38064637", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.27825679474647513, "ground_truth": 0}, {"key": "38064637", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.16667538758560937, "ground_truth": 0}, {"key": "40886108", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9458012692457187, "ground_truth": 0}, {"key": "40886108", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9594592612643891, "ground_truth": 0}, {"key": "40886108", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9385759527023175, "ground_truth": 0}, {"key": "40886108", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.934395157009016, "ground_truth": 0}, {"key": "40886108", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149042693782, "ground_truth": 0}, {"key": "38554603", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7476159543871297, "ground_truth": 0}, {"key": "38554603", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.789233693972401, "ground_truth": 0}, {"key": "38554603", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5736784047160295, "ground_truth": 0}, {"key": "38554603", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460137142798527, "ground_truth": 0}, {"key": "38554603", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300631969315, "ground_truth": 0}, {"key": "39115586", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4397473100726564, "ground_truth": 0}, {"key": "39115586", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5019531392091217, "ground_truth": 0}, {"key": "39115586", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4707365951374156, "ground_truth": 0}, {"key": "39115586", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37022540766792644, "ground_truth": 0}, {"key": "39115586", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.689305629943943, "ground_truth": 0}, {"key": "38786314", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.517570903566878, "ground_truth": 0}, {"key": "38786314", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.476579658799419, "ground_truth": 0}, {"key": "38786314", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7041601451204146, "ground_truth": 0}, {"key": "38786314", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118976138216, "ground_truth": 0}, {"key": "38786314", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802684954327, "ground_truth": 0}, {"key": "38721078", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8856314709924612, "ground_truth": 0}, {"key": "38721078", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8661325040091513, "ground_truth": 0}, {"key": "38721078", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9178933717350025, "ground_truth": 0}, {"key": "38721078", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952954135788, "ground_truth": 0}, {"key": "38721078", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215434781221, "ground_truth": 0}, {"key": "39475467", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.560252696445045, "ground_truth": 0}, {"key": "39475467", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37570647137898666, "ground_truth": 0}, {"key": "39475467", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7325918456255924, "ground_truth": 0}, {"key": "39475467", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47657965131510177, "ground_truth": 0}, {"key": "39475467", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283120821232, "ground_truth": 0}, {"key": "35691234", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8233283947408241, "ground_truth": 0}, {"key": "35691234", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238818153977, "ground_truth": 0}, {"key": "35691234", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6352224531457632, "ground_truth": 0}, {"key": "35691234", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073606941909, "ground_truth": 0}, {"key": "35691234", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324753823601, "ground_truth": 0}, {"key": "36871390", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5525397041258132, "ground_truth": 0}, {"key": "36871390", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5428632914255114, "ground_truth": 0}, {"key": "36871390", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6388352594089001, "ground_truth": 0}, {"key": "36871390", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.48633157858313225, "ground_truth": 0}, {"key": "36871390", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175178534963, "ground_truth": 0}, {"key": "31730844", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5058591128347559, "ground_truth": 0}, {"key": "31730844", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.24508501317857523, "ground_truth": 0}, {"key": "31730844", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.37204878290404303, "ground_truth": 0}, {"key": "31730844", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.571766604304855, "ground_truth": 0}, {"key": "31730844", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2893717152510823, "ground_truth": 0}, {"key": "30810940", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4320634041097933, "ground_truth": 0}, {"key": "30810940", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4863315435596838, "ground_truth": 0}, {"key": "30810940", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5832033631818064, "ground_truth": 0}, {"key": "30810940", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740109978773, "ground_truth": 0}, {"key": "30810940", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593393301667, "ground_truth": 0}, {"key": "39352003", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8840392962060005, "ground_truth": 0}, {"key": "39352003", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9252299593205303, "ground_truth": 0}, {"key": "39352003", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8732148273910554, "ground_truth": 0}, {"key": "39352003", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9196425316164977, "ground_truth": 0}, {"key": "39352003", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9059898095753334, "ground_truth": 0}, {"key": "40118123", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5907791930525632, "ground_truth": 0}, {"key": "40118123", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.629774610252431, "ground_truth": 0}, {"key": "40118123", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5679366115690447, "ground_truth": 0}, {"key": "40118123", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984852575891, "ground_truth": 0}, {"key": "40118123", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880399604223, "ground_truth": 0}, {"key": "37114191", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.41111090216689905, "ground_truth": 0}, {"key": "37114191", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5097643714482081, "ground_truth": 0}, {"key": "37114191", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6224593545073938, "ground_truth": 0}, {"key": "37114191", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.45132650440604005, "ground_truth": 0}, {"key": "37114191", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571366930991242, "ground_truth": 0}, {"key": "39268203", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7248702640751375, "ground_truth": 0}, {"key": "39268203", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7690802390226573, "ground_truth": 0}, {"key": "39268203", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.738669078775542, "ground_truth": 0}, {"key": "39268203", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689424468334, "ground_truth": 0}, {"key": "39268203", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.740174350727893, "ground_truth": 0}, {"key": "37950968", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5156199205880062, "ground_truth": 0}, {"key": "37950968", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5563995791998123, "ground_truth": 0}, {"key": "37950968", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.34158248451055695, "ground_truth": 0}, {"key": "37950968", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947297053889, "ground_truth": 0}, {"key": "37950968", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.34510526500275984, "ground_truth": 0}, {"key": "34959807", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6774740165097503, "ground_truth": 0}, {"key": "34959807", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.55253968166716, "ground_truth": 0}, {"key": "34959807", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7446563360907514, "ground_truth": 0}, {"key": "34959807", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544264012694, "ground_truth": 0}, {"key": "34959807", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424419283532, "ground_truth": 0}, {"key": "35631314", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8832359839280828, "ground_truth": 0}, {"key": "35631314", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7648916161101033, "ground_truth": 0}, {"key": "35631314", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8940517084671591, "ground_truth": 0}, {"key": "35631314", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9353465090540317, "ground_truth": 0}, {"key": "35631314", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9309620676262245, "ground_truth": 0}, {"key": "38082365", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8164063694297292, "ground_truth": 0}, {"key": "38082365", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9399133532866698, "ground_truth": 0}, {"key": "38082365", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7892336909299512, "ground_truth": 0}, {"key": "38082365", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9012274118584929, "ground_truth": 0}, {"key": "38082365", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748561245896, "ground_truth": 0}, {"key": "37242829", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5660185403508378, "ground_truth": 0}, {"key": "37242829", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5983121938876503, "ground_truth": 0}, {"key": "37242829", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3191213947676817, "ground_truth": 0}, {"key": "37242829", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064549812002, "ground_truth": 0}, {"key": "37242829", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.35220177482270615, "ground_truth": 0}, {"key": "38556068", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.33111973254457344, "ground_truth": 0}, {"key": "38556068", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5039061875188177, "ground_truth": 0}, {"key": "38556068", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6187804347326832, "ground_truth": 0}, {"key": "38556068", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.45713671254303945, "ground_truth": 0}, {"key": "38556068", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061876676095, "ground_truth": 0}, {"key": "32969336", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6601723624168193, "ground_truth": 0}, {"key": "32969336", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8596637459503615, "ground_truth": 0}, {"key": "32969336", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6774739863810654, "ground_truth": 0}, {"key": "32969336", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998670024619, "ground_truth": 0}, {"key": "32969336", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.566018538691664, "ground_truth": 0}, {"key": "36825153", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3191213742892288, "ground_truth": 0}, {"key": "36825153", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3665897149787922, "ground_truth": 0}, {"key": "36825153", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3830641676736548, "ground_truth": 0}, {"key": "36825153", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.14033624549229998, "ground_truth": 0}, {"key": "36825153", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519859123593076, "ground_truth": 0}, {"key": "41050146", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8643104635290837, "ground_truth": 0}, {"key": "41050146", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.863391598620658, "ground_truth": 0}, {"key": "41050146", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7074047143429993, "ground_truth": 0}, {"key": "41050146", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324834812567, "ground_truth": 0}, {"key": "41050146", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.795658093655913, "ground_truth": 0}, {"key": "27865037", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5774953491131583, "ground_truth": 0}, {"key": "27865037", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.27048019681891083, "ground_truth": 0}, {"key": "27865037", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.34334174904832293, "ground_truth": 0}, {"key": "27865037", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784196484583, "ground_truth": 0}, {"key": "27865037", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494467283253, "ground_truth": 0}, {"key": "39868565", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6757645954624703, "ground_truth": 0}, {"key": "39868565", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45713668330280405, "ground_truth": 0}, {"key": "39868565", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49609385113888077, "ground_truth": 0}, {"key": "39868565", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591176836199, "ground_truth": 0}, {"key": "39868565", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646021868958, "ground_truth": 0}, {"key": "37761968", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7264256033594011, "ground_truth": 0}, {"key": "37761968", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7201715296568995, "ground_truth": 0}, {"key": "37761968", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.699254409183613, "ground_truth": 0}, {"key": "37761968", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704648049436033, "ground_truth": 0}, {"key": "37761968", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389828451549, "ground_truth": 0}, {"key": "16326139", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.27048022717948855, "ground_truth": 0}, {"key": "16326139", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4339814586089067, "ground_truth": 0}, {"key": "16326139", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.40922078739299067, "ground_truth": 0}, {"key": "16326139", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.314050550230239, "ground_truth": 0}, {"key": "16326139", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510836374626465, "ground_truth": 0}, {"key": "36568381", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7325918435524605, "ground_truth": 0}, {"key": "36568381", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.567936613454097, "ground_truth": 0}, {"key": "36568381", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8221891372316371, "ground_truth": 0}, {"key": "36568381", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918457715229, "ground_truth": 0}, {"key": "36568381", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898463542354, "ground_truth": 0}, {"key": "39855613", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7185944070700203, "ground_truth": 0}, {"key": "39855613", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8386797568826982, "ground_truth": 0}, {"key": "39855613", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9149009582163825, "ground_truth": 0}, {"key": "39855613", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199766906005, "ground_truth": 0}, {"key": "39855613", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085623845258, "ground_truth": 0}, {"key": "29856302", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4941409028717746, "ground_truth": 0}, {"key": "29856302", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6584175116192009, "ground_truth": 0}, {"key": "29856302", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4980468994735011, "ground_truth": 0}, {"key": "29856302", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711886683608, "ground_truth": 0}, {"key": "29856302", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633721392296, "ground_truth": 0}, {"key": "35641106", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7008948210243722, "ground_truth": 0}, {"key": "35641106", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6566582759286154, "ground_truth": 0}, {"key": "35641106", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6334102555041432, "ground_truth": 0}, {"key": "35641106", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.631594330181457, "ground_truth": 0}, {"key": "35641106", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575403174162, "ground_truth": 0}, {"key": "39474558", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3665897407505427, "ground_truth": 0}, {"key": "39474558", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.39793841098142235, "ground_truth": 0}, {"key": "39474558", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42059956978853114, "ground_truth": 0}, {"key": "39474558", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819783689652, "ground_truth": 0}, {"key": "39474558", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241765725764, "ground_truth": 0}, {"key": "34338135", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7943849592661503, "ground_truth": 0}, {"key": "34338135", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8479677722669414, "ground_truth": 0}, {"key": "34338135", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8864204118716302, "ground_truth": 0}, {"key": "34338135", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772323499779, "ground_truth": 0}, {"key": "34338135", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511436951531, "ground_truth": 0}, {"key": "35870330", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6315943187061339, "ground_truth": 0}, {"key": "35870330", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8428631399765164, "ground_truth": 0}, {"key": "35870330", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8799743695634488, "ground_truth": 0}, {"key": "35870330", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210681131831, "ground_truth": 0}, {"key": "35870330", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321925960763, "ground_truth": 0}, {"key": "24478245", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8643104573463919, "ground_truth": 0}, {"key": "24478245", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7264256017398093, "ground_truth": 0}, {"key": "24478245", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.827828149407485, "ground_truth": 0}, {"key": "24478245", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.763483779983381, "ground_truth": 0}, {"key": "24478245", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513707660412, "ground_truth": 0}, {"key": "38485946", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7371581583149335, "ground_truth": 0}, {"key": "38485946", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4649015280095418, "ground_truth": 0}, {"key": "38485946", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5813031150427022, "ground_truth": 0}, {"key": "38485946", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872302257349, "ground_truth": 0}, {"key": "38485946", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102684595496, "ground_truth": 0}, {"key": "32509613", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8976952965120906, "ground_truth": 0}, {"key": "32509613", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8969755691053868, "ground_truth": 0}, {"key": "32509613", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8152324922638793, "ground_truth": 0}, {"key": "32509613", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104458994567, "ground_truth": 0}, {"key": "32509613", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528075770204, "ground_truth": 0}, {"key": "34078819", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8740772407610661, "ground_truth": 0}, {"key": "34078819", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6020615886489044, "ground_truth": 0}, {"key": "34078819", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9053223019236746, "ground_truth": 0}, {"key": "34078819", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.885631474842568, "ground_truth": 0}, {"key": "34078819", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754328058282, "ground_truth": 0}, {"key": "39523865", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6495786332286019, "ground_truth": 0}, {"key": "39523865", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.752012585922785, "ground_truth": 0}, {"key": "39523865", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6477981931920904, "ground_truth": 0}, {"key": "39523865", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984743075899, "ground_truth": 0}, {"key": "39523865", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786747258897, "ground_truth": 0}, {"key": "33146158", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3451052530283459, "ground_truth": 0}, {"key": "33146158", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7577943830575664, "ground_truth": 0}, {"key": "33146158", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4649015376523981, "ground_truth": 0}, {"key": "33146158", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.345105275905698, "ground_truth": 0}, {"key": "33146158", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4902356193604411, "ground_truth": 0}, {"key": "32083974", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6531269352832987, "ground_truth": 0}, {"key": "32083974", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4571367268268026, "ground_truth": 0}, {"key": "32083974", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7279754646941661, "ground_truth": 0}, {"key": "32083974", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291333465652, "ground_truth": 0}, {"key": "32083974", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269396750419, "ground_truth": 0}, {"key": "34378482", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.95759617236013, "ground_truth": 0}, {"key": "34378482", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9553191276863597, "ground_truth": 0}, {"key": "34378482", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9309620778912846, "ground_truth": 0}, {"key": "34378482", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748579657758, "ground_truth": 0}, {"key": "34378482", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9224823488303082, "ground_truth": 0}, {"key": "38080102", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548631401765, "ground_truth": 0}, {"key": "38080102", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7745833967709845, "ground_truth": 0}, {"key": "38080102", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4804786847457688, "ground_truth": 0}, {"key": "38080102", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531418702213, "ground_truth": 0}, {"key": "38080102", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.564098445204087, "ground_truth": 0}, {"key": "40244537", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6001883346118292, "ground_truth": 0}, {"key": "40244537", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5234203660816922, "ground_truth": 0}, {"key": "40244537", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6442250842681843, "ground_truth": 0}, {"key": "40244537", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216319106426, "ground_truth": 0}, {"key": "40244537", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.48828338666337434, "ground_truth": 0}, {"key": "33497789", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8661325018986701, "ground_truth": 0}, {"key": "33497789", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9099069920655977, "ground_truth": 0}, {"key": "33497789", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8529354819667669, "ground_truth": 0}, {"key": "33497789", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9268352783855893, "ground_truth": 0}, {"key": "33497789", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897193964993, "ground_truth": 0}, {"key": "28816889", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8267117885304944, "ground_truth": 0}, {"key": "28816889", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7606506392193714, "ground_truth": 0}, {"key": "28816889", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8832359947447751, "ground_truth": 0}, {"key": "28816889", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624639257909, "ground_truth": 0}, {"key": "28816889", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476671971979, "ground_truth": 0}, {"key": "38157127", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3557748685424399, "ground_truth": 0}, {"key": "38157127", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.23934936881783297, "ground_truth": 0}, {"key": "38157127", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.33285233656398544, "ground_truth": 0}, {"key": "38157127", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4263215976365, "ground_truth": 0}, {"key": "38157127", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633809374112, "ground_truth": 0}, {"key": "36183569", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.41111087862869866, "ground_truth": 0}, {"key": "36183569", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3345894464068438, "ground_truth": 0}, {"key": "36183569", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.300745585036236, "ground_truth": 0}, {"key": "36183569", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937837898012294, "ground_truth": 0}, {"key": "36183569", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.41869689990103837, "ground_truth": 0}, {"key": "36012016", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7446563426479595, "ground_truth": 0}, {"key": "36012016", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6601723813386096, "ground_truth": 0}, {"key": "36012016", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.717011883018382, "ground_truth": 0}, {"key": "36012016", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892337142845968, "ground_truth": 0}, {"key": "36012016", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629586285829586, "ground_truth": 0}, {"key": "34571973", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6636689614249831, "ground_truth": 0}, {"key": "34571973", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.53120933075082, "ground_truth": 0}, {"key": "34571973", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4668455866980679, "ground_truth": 0}, {"key": "34571973", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "34571973", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218814919732556, "ground_truth": 0}, {"key": "38707498", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7956581105757045, "ground_truth": 0}, {"key": "38707498", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.783988464586353, "ground_truth": 0}, {"key": "38707498", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8489721981809512, "ground_truth": 0}, {"key": "38707498", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300553747382, "ground_truth": 0}, {"key": "38707498", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799928968561674, "ground_truth": 0}, {"key": "35459082", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9594592627378011, "ground_truth": 0}, {"key": "35459082", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9575961671336382, "ground_truth": 0}, {"key": "35459082", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9629528303107076, "ground_truth": 0}, {"key": "35459082", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9648551546263523, "ground_truth": 0}, {"key": "35459082", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9453993960881485, "ground_truth": 0}, {"key": "39464041", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9788748086039344, "ground_truth": 0}, {"key": "39464041", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9643214483329244, "ground_truth": 0}, {"key": "39464041", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9695556524006483, "ground_truth": 0}, {"key": "39464041", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9804313225133118, "ground_truth": 0}, {"key": "39464041", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9874720685545197, "ground_truth": 0}, {"key": "23782052", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4668455745514376, "ground_truth": 0}, {"key": "23782052", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4397473271798566, "ground_truth": 0}, {"key": "23782052", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6150878673835143, "ground_truth": 0}, {"key": "23782052", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.42441200484053315, "ground_truth": 0}, {"key": "23782052", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898513879076, "ground_truth": 0}, {"key": "36568455", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6740504683675173, "ground_truth": 0}, {"key": "36568455", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7956581106834696, "ground_truth": 0}, {"key": "36568455", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8529354785095542, "ground_truth": 0}, {"key": "36568455", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.852935480008699, "ground_truth": 0}, {"key": "36568455", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163703768968, "ground_truth": 0}, {"key": "38469552", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9339146186912808, "ground_truth": 0}, {"key": "38469552", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7799929083894077, "ground_truth": 0}, {"key": "38469552", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8832359939042612, "ground_truth": 0}, {"key": "38469552", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9289263373366257, "ground_truth": 0}, {"key": "38469552", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891241466843, "ground_truth": 0}, {"key": "35922277", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8365545600069896, "ground_truth": 0}, {"key": "35922277", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8799743799351449, "ground_truth": 0}, {"key": "35922277", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9019206826164357, "ground_truth": 0}, {"key": "35922277", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898728715397, "ground_truth": 0}, {"key": "35922277", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8969755718269401, "ground_truth": 0}, {"key": "32744293", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7008948128832575, "ground_truth": 0}, {"key": "32744293", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8652240860827989, "ground_truth": 0}, {"key": "32744293", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8679338379941177, "ground_truth": 0}, {"key": "32744293", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059662557202, "ground_truth": 0}, {"key": "32744293", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191600657454, "ground_truth": 0}, {"key": "30972362", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9529258256449402, "ground_truth": 0}, {"key": "30972362", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9241418203868582, "ground_truth": 0}, {"key": "30972362", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.959762055083528, "ground_truth": 0}, {"key": "30972362", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.962952831370971, "ground_truth": 0}, {"key": "30972362", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9724147185199767, "ground_truth": 0}, {"key": "36380943", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6992544334650234, "ground_truth": 0}, {"key": "36380943", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7563575560871029, "ground_truth": 0}, {"key": "36380943", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5832033466207643, "ground_truth": 0}, {"key": "36380943", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031738114864709, "ground_truth": 0}, {"key": "36380943", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.862467550879484, "ground_truth": 0}, {"key": "36929355", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6406358430108418, "ground_truth": 0}, {"key": "36929355", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6370308125460766, "ground_truth": 0}, {"key": "36929355", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.815232481377074, "ground_truth": 0}, {"key": "36929355", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416527464688, "ground_truth": 0}, {"key": "36929355", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033275622733, "ground_truth": 0}, {"key": "39127206", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6297746236364931, "ground_truth": 0}, {"key": "39127206", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.327668304786823, "ground_truth": 0}, {"key": "39127206", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5794004341135146, "ground_truth": 0}, {"key": "39127206", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358247540793, "ground_truth": 0}, {"key": "39127206", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.49804689978452926, "ground_truth": 0}, {"key": "36128318", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.29746995579437685, "ground_truth": 0}, {"key": "36128318", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.18242553419734983, "ground_truth": 0}, {"key": "36128318", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.25091278477738793, "ground_truth": 0}, {"key": "36128318", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3398276326943171, "ground_truth": 0}, {"key": "36128318", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.17106119297783615, "ground_truth": 0}, {"key": "39863480", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9053222821179802, "ground_truth": 0}, {"key": "39863480", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8152324741473055, "ground_truth": 0}, {"key": "39863480", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8872045883160924, "ground_truth": 0}, {"key": "39863480", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366500079954, "ground_truth": 0}, {"key": "39863480", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068792221018, "ground_truth": 0}, {"key": "38634057", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8140528062724812, "ground_truth": 0}, {"key": "38634057", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7534666661085919, "ground_truth": 0}, {"key": "38634057", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8128673195155419, "ground_truth": 0}, {"key": "38634057", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224411535393, "ground_truth": 0}, {"key": "38634057", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544012040401, "ground_truth": 0}, {"key": "33131935", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8643104577327928, "ground_truth": 0}, {"key": "33131935", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.900529784095285, "ground_truth": 0}, {"key": "33131935", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7905303219834704, "ground_truth": 0}, {"key": "33131935", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094044912454, "ground_truth": 0}, {"key": "33131935", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367993132484, "ground_truth": 0}, {"key": "39021319", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.464901568494698, "ground_truth": 0}, {"key": "39021319", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.39793843823052677, "ground_truth": 0}, {"key": "39021319", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.586996448733193, "ground_truth": 0}, {"key": "39021319", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089181547939, "ground_truth": 0}, {"key": "39021319", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004113401649, "ground_truth": 0}, {"key": "40644571", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6876300004860874, "ground_truth": 0}, {"key": "40644571", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3191213824737439, "ground_truth": 0}, {"key": "40644571", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6001883539607166, "ground_truth": 0}, {"key": "40644571", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.441672980458548, "ground_truth": 0}, {"key": "40644571", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.505859092539229, "ground_truth": 0}, {"key": "14681877", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9353465088904761, "ground_truth": 0}, {"key": "14681877", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9702399043570713, "ground_truth": 0}, {"key": "14681877", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9230391679824794, "ground_truth": 0}, {"key": "14681877", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9273632944365332, "ground_truth": 0}, {"key": "14681877", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.827828152112893, "ground_truth": 0}, {"key": "36570890", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5039061806344375, "ground_truth": 0}, {"key": "36570890", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.611381993987245, "ground_truth": 0}, {"key": "36570890", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6859494593655245, "ground_truth": 0}, {"key": "36570890", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061601446181, "ground_truth": 0}, {"key": "36570890", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.667147701205621, "ground_truth": 0}, {"key": "30452755", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8661325224479623, "ground_truth": 0}, {"key": "30452755", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7549149879061428, "ground_truth": 0}, {"key": "30452755", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8289387927515253, "ground_truth": 0}, {"key": "30452755", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163803602212, "ground_truth": 0}, {"key": "30452755", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281584309238, "ground_truth": 0}, {"key": "37347053", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5755880030173479, "ground_truth": 0}, {"key": "37347053", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4882834105907825, "ground_truth": 0}, {"key": "37347053", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.47268349482158317, "ground_truth": 0}, {"key": "37347053", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583359978959, "ground_truth": 0}, {"key": "37347053", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318196124196, "ground_truth": 0}, {"key": "38890979", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.42823342685483334, "ground_truth": 0}, {"key": "38890979", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4130035948530885, "ground_truth": 0}, {"key": "38890979", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4941409222086941, "ground_truth": 0}, {"key": "38890979", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3775406715426185, "ground_truth": 0}, {"key": "38890979", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4863315155381199, "ground_truth": 0}, {"key": "32974694", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548845641968, "ground_truth": 0}, {"key": "32974694", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7826624700945553, "ground_truth": 0}, {"key": "32974694", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7106283055026116, "ground_truth": 0}, {"key": "32974694", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307529297174, "ground_truth": 0}, {"key": "32974694", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295198011592914, "ground_truth": 0}, {"key": "38519940", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9130583378950222, "ground_truth": 0}, {"key": "38519940", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7431680217640997, "ground_truth": 0}, {"key": "38519940", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8688267632082293, "ground_truth": 0}, {"key": "38519940", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9066531195076799, "ground_truth": 0}, {"key": "38519940", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338502324185, "ground_truth": 0}, {"key": "38870104", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.87321482325417, "ground_truth": 0}, {"key": "38870104", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8418256491870513, "ground_truth": 0}, {"key": "38870104", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7786493368980744, "ground_truth": 0}, {"key": "38870104", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846513744116, "ground_truth": 0}, {"key": "38870104", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281467040332, "ground_truth": 0}, {"key": "34283161", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5389832331805137, "ground_truth": 0}, {"key": "34283161", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.525368830722265, "ground_truth": 0}, {"key": "34283161", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.28298811846633304, "ground_truth": 0}, {"key": "34283161", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074557228616966, "ground_truth": 0}, {"key": "34283161", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.329391716897148, "ground_truth": 0}, {"key": "31650463", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548880500906, "ground_truth": 0}, {"key": "31650463", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8056322099390781, "ground_truth": 0}, {"key": "31650463", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7106283032659687, "ground_truth": 0}, {"key": "31650463", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723570535728, "ground_truth": 0}, {"key": "31650463", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217431908945127, "ground_truth": 0}, {"key": "35589432", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7676898488957012, "ground_truth": 0}, {"key": "35589432", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6150878370478873, "ground_truth": 0}, {"key": "35589432", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8333245954769678, "ground_truth": 0}, {"key": "35589432", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916228087936, "ground_truth": 0}, {"key": "35589432", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799929032578145, "ground_truth": 0}, {"key": "14412752", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6636689669279473, "ground_truth": 0}, {"key": "14412752", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6706082730350295, "ground_truth": 0}, {"key": "14412752", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7217432206087134, "ground_truth": 0}, {"key": "14412752", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.65135488001038, "ground_truth": 0}, {"key": "14412752", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526802214319, "ground_truth": 0}, {"key": "37271183", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9289263348221316, "ground_truth": 0}, {"key": "37271183", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.950041471705524, "ground_truth": 0}, {"key": "37271183", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9815951094669596, "ground_truth": 0}, {"key": "37271183", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9367494723279315, "ground_truth": 0}, {"key": "37271183", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9600626850753613, "ground_truth": 0}, {"key": "35588153", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9485372301195885, "ground_truth": 0}, {"key": "35588153", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9489172657809563, "ground_truth": 0}, {"key": "35588153", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9626731103094689, "ground_truth": 0}, {"key": "35588153", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105492983003, "ground_truth": 0}, {"key": "35588153", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9130583421162198, "ground_truth": 0}, {"key": "39876692", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.749087194185366, "ground_truth": 0}, {"key": "39876692", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7534666365363798, "ground_truth": 0}, {"key": "39876692", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8679338325883117, "ground_truth": 0}, {"key": "39876692", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316918102342, "ground_truth": 0}, {"key": "39876692", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.47268349727590037, "ground_truth": 0}, {"key": "38992323", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7786493016025877, "ground_truth": 0}, {"key": "38992323", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7341195351979848, "ground_truth": 0}, {"key": "38992323", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8962513700621161, "ground_truth": 0}, {"key": "38992323", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690880206958, "ground_truth": 0}, {"key": "38992323", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825882588982, "ground_truth": 0}, {"key": "37556002", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8386797731967367, "ground_truth": 0}, {"key": "37556002", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6688802659582164, "ground_truth": 0}, {"key": "37556002", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9319595876300509, "ground_truth": 0}, {"key": "37556002", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338442165916, "ground_truth": 0}, {"key": "37556002", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526322222186, "ground_truth": 0}, {"key": "39875801", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8311430433556959, "ground_truth": 0}, {"key": "39875801", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7090191564969448, "ground_truth": 0}, {"key": "39875801", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8104789007966374, "ground_truth": 0}, {"key": "39875801", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424353389907, "ground_truth": 0}, {"key": "39875801", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159726617432, "ground_truth": 0}, {"key": "39272285", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.12336561381086206, "ground_truth": 0}, {"key": "39272285", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.12765261704823716, "ground_truth": 0}, {"key": "39272285", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.26284184874896077, "ground_truth": 0}, {"key": "39272285", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.11596071337079812, "ground_truth": 0}, {"key": "39272285", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.19930800465453125, "ground_truth": 0}, {"key": "39629714", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7233094480825758, "ground_truth": 0}, {"key": "39629714", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6959583402175373, "ground_truth": 0}, {"key": "39629714", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2766905339078497, "ground_truth": 0}, {"key": "39629714", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544170327019, "ground_truth": 0}, {"key": "39629714", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711485788043, "ground_truth": 0}, {"key": "34043257", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.573678399244475, "ground_truth": 0}, {"key": "34043257", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5755880179615982, "ground_truth": 0}, {"key": "34043257", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8080672116727347, "ground_truth": 0}, {"key": "34043257", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933332563675, "ground_truth": 0}, {"key": "34043257", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352830043492, "ground_truth": 0}, {"key": "33995240", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.47463117855678233, "ground_truth": 0}, {"key": "33995240", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5926666243815499, "ground_truth": 0}, {"key": "33995240", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6909762799075564, "ground_truth": 0}, {"key": "33995240", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4339814376630729, "ground_truth": 0}, {"key": "33995240", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218814214506573, "ground_truth": 0}, {"key": "39399948", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9092645113546096, "ground_truth": 0}, {"key": "39399948", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6187804020049784, "ground_truth": 0}, {"key": "39399948", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6477982029753334, "ground_truth": 0}, {"key": "39399948", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210640754162, "ground_truth": 0}, {"key": "39399948", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582587655483, "ground_truth": 0}, {"key": "33185890", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7057850348268072, "ground_truth": 0}, {"key": "33185890", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7476159490499062, "ground_truth": 0}, {"key": "33185890", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8104789140727503, "ground_truth": 0}, {"key": "33185890", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432083386071, "ground_truth": 0}, {"key": "33185890", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437723036924, "ground_truth": 0}, {"key": "35280425", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8386797706510779, "ground_truth": 0}, {"key": "35280425", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5983121994350967, "ground_truth": 0}, {"key": "35280425", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7264256221286703, "ground_truth": 0}, {"key": "35280425", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9257686302376824, "ground_truth": 0}, {"key": "35280425", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711720279739, "ground_truth": 0}, {"key": "16365170", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8333246142056031, "ground_truth": 0}, {"key": "16365170", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8998277915524805, "ground_truth": 0}, {"key": "16365170", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9213576150756999, "ground_truth": 0}, {"key": "16365170", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281464311577, "ground_truth": 0}, {"key": "16365170", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178998599845, "ground_truth": 0}, {"key": "24388238", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.653126926735203, "ground_truth": 0}, {"key": "24388238", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.49804691034231663, "ground_truth": 0}, {"key": "24388238", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5774953841543978, "ground_truth": 0}, {"key": "24388238", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883485986097, "ground_truth": 0}, {"key": "24388238", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947176182152, "ground_truth": 0}, {"key": "35024827", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7577943701366197, "ground_truth": 0}, {"key": "35024827", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7549149825376624, "ground_truth": 0}, {"key": "35024827", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7008948336811449, "ground_truth": 0}, {"key": "35024827", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159684124543, "ground_truth": 0}, {"key": "35024827", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165172551767, "ground_truth": 0}, {"key": "38624944", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7732163714532353, "ground_truth": 0}, {"key": "38624944", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7690802357926942, "ground_truth": 0}, {"key": "38624944", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5679366338331936, "ground_truth": 0}, {"key": "38624944", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423336304142, "ground_truth": 0}, {"key": "38624944", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919978611178, "ground_truth": 0}, {"key": "34719830", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7866228264907057, "ground_truth": 0}, {"key": "34719830", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8092759674029812, "ground_truth": 0}, {"key": "34719830", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7839884591925512, "ground_truth": 0}, {"key": "34719830", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549448542397, "ground_truth": 0}, {"key": "34719830", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802441416759, "ground_truth": 0}, {"key": "38995225", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.42441197382435875, "ground_truth": 0}, {"key": "38995225", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.542863275014105, "ground_truth": 0}, {"key": "38995225", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5851011691376561, "ground_truth": 0}, {"key": "38995225", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4843800761414803, "ground_truth": 0}, {"key": "38995225", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.39047585580442223, "ground_truth": 0}, {"key": "34242311", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7401743541295682, "ground_truth": 0}, {"key": "34242311", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6388352669901713, "ground_truth": 0}, {"key": "34242311", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.684264011242772, "ground_truth": 0}, {"key": "34242311", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.763483773663673, "ground_truth": 0}, {"key": "34242311", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789140676737, "ground_truth": 0}, {"key": "39253748", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8175744871206093, "ground_truth": 0}, {"key": "39253748", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8365545747682909, "ground_truth": 0}, {"key": "39253748", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.787931196397549, "ground_truth": 0}, {"key": "39253748", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933498423173, "ground_truth": 0}, {"key": "39253748", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307487281503, "ground_truth": 0}, {"key": "37131104", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9947391478326716, "ground_truth": 0}, {"key": "37131104", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9959927109180395, "ground_truth": 0}, {"key": "37131104", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9958012044789146, "ground_truth": 0}, {"key": "37131104", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9924812813266359, "ground_truth": 0}, {"key": "37131104", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9884918515440585, "ground_truth": 0}, {"key": "38490554", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8164063839353518, "ground_truth": 0}, {"key": "38490554", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7981867748920206, "ground_truth": 0}, {"key": "38490554", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8221891222251017, "ground_truth": 0}, {"key": "38490554", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9500414745981661, "ground_truth": 0}, {"key": "38490554", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338374803136, "ground_truth": 0}, {"key": "29009500", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.37937838795255874, "ground_truth": 0}, {"key": "29009500", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.447460285197772, "ground_truth": 0}, {"key": "29009500", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5331544139180684, "ground_truth": 0}, {"key": "29009500", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47463117654742987, "ground_truth": 0}, {"key": "29009500", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381546337599, "ground_truth": 0}, {"key": "36703057", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5409238900431053, "ground_truth": 0}, {"key": "36703057", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5813031039856341, "ground_truth": 0}, {"key": "36703057", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7634837580800304, "ground_truth": 0}, {"key": "36703057", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352881086798, "ground_truth": 0}, {"key": "36703057", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118781868265, "ground_truth": 0}, {"key": "34876987", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.893309410557785, "ground_truth": 0}, {"key": "34876987", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.887984047118188, "ground_truth": 0}, {"key": "34876987", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8799743792203578, "ground_truth": 0}, {"key": "34876987", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9073122270997198, "ground_truth": 0}, {"key": "34876987", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615381951918749, "ground_truth": 0}, {"key": "36209258", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8044058990794972, "ground_truth": 0}, {"key": "36209258", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.876634379244108, "ground_truth": 0}, {"key": "36209258", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8056322026827446, "ground_truth": 0}, {"key": "36209258", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324780361413, "ground_truth": 0}, {"key": "36209258", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916181368783, "ground_truth": 0}, {"key": "36854437", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.350421366962009, "ground_truth": 0}, {"key": "36854437", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4148988713895323, "ground_truth": 0}, {"key": "36854437", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3830641756090133, "ground_truth": 0}, {"key": "36854437", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.25832598327676626, "ground_truth": 0}, {"key": "36854437", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.17781086239522845, "ground_truth": 0}, {"key": "38047723", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.21601152874337956, "ground_truth": 0}, {"key": "38047723", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.27512972126246754, "ground_truth": 0}, {"key": "38047723", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1311732224215571, "ground_truth": 0}, {"key": "38047723", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2479874339977935, "ground_truth": 0}, {"key": "38047723", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.15713685495163124, "ground_truth": 0}, {"key": "34287816", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5370414216628441, "ground_truth": 0}, {"key": "34287816", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5486734905868641, "ground_truth": 0}, {"key": "34287816", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5506073519404926, "ground_truth": 0}, {"key": "34287816", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619229031073514, "ground_truth": 0}, {"key": "34287816", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891659899339, "ground_truth": 0}, {"key": "33235855", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.949669364253888, "ground_truth": 0}, {"key": "33235855", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9597620548668775, "ground_truth": 0}, {"key": "33235855", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9817357224564583, "ground_truth": 0}, {"key": "33235855", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9600626863974664, "ground_truth": 0}, {"key": "33235855", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.926303735361163, "ground_truth": 0}, {"key": "34381016", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7772998644009612, "ground_truth": 0}, {"key": "34381016", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7505527721565965, "ground_truth": 0}, {"key": "34381016", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8198933287922457, "ground_truth": 0}, {"key": "34381016", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300617465139, "ground_truth": 0}, {"key": "34381016", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074047099338735, "ground_truth": 0}, {"key": "28064995", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6334102499911649, "ground_truth": 0}, {"key": "28064995", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8031738023569144, "ground_truth": 0}, {"key": "28064995", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5983121743100835, "ground_truth": 0}, {"key": "28064995", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.48633152436969374, "ground_truth": 0}, {"key": "28064995", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.42823340667759263, "ground_truth": 0}, {"key": "37576197", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.31742625970207416, "ground_truth": 0}, {"key": "37576197", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.538983226739408, "ground_truth": 0}, {"key": "37576197", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5525396975474979, "ground_truth": 0}, {"key": "37576197", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.36116470265991174, "ground_truth": 0}, {"key": "37576197", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684668976645, "ground_truth": 0}, {"key": "34454741", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.42059957360359146, "ground_truth": 0}, {"key": "34454741", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48242911174851566, "ground_truth": 0}, {"key": "34454741", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46101676561078986, "ground_truth": 0}, {"key": "34454741", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.46879061655271287, "ground_truth": 0}, {"key": "34454741", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2689414223541498, "ground_truth": 0}, {"key": "34766970", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.30902371587024785, "ground_truth": 0}, {"key": "34766970", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2861692695218957, "ground_truth": 0}, {"key": "34766970", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1801066579849941, "ground_truth": 0}, {"key": "34766970", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.39420092505434423, "ground_truth": 0}, {"key": "34766970", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.31742628660480554, "ground_truth": 0}, {"key": "35574186", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7969253734919377, "ground_truth": 0}, {"key": "35574186", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7416740187014735, "ground_truth": 0}, {"key": "35574186", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8289388181683908, "ground_truth": 0}, {"key": "35574186", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677635741621, "ground_truth": 0}, {"key": "35574186", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786396348129, "ground_truth": 0}, {"key": "35486470", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5409238504593022, "ground_truth": 0}, {"key": "35486470", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4339814894737137, "ground_truth": 0}, {"key": "35486470", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6495785933701498, "ground_truth": 0}, {"key": "35486470", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448014191639099, "ground_truth": 0}, {"key": "35486470", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282333863983429, "ground_truth": 0}, {"key": "40977702", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6187804242880289, "ground_truth": 0}, {"key": "40977702", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6774740018745995, "ground_truth": 0}, {"key": "40977702", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7341195364311542, "ground_truth": 0}, {"key": "40977702", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.44360041258829974, "ground_truth": 0}, {"key": "40977702", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "35336618", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9073122255703925, "ground_truth": 0}, {"key": "35336618", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8267118015576422, "ground_truth": 0}, {"key": "35336618", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9407897466351679, "ground_truth": 0}, {"key": "35336618", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9005297866748656, "ground_truth": 0}, {"key": "35336618", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9549844698689438, "ground_truth": 0}, {"key": "33024679", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6477982222221991, "ground_truth": 0}, {"key": "33024679", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5448013905375255, "ground_truth": 0}, {"key": "33024679", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8438950966357325, "ground_truth": 0}, {"key": "33024679", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689515239503, "ground_truth": 0}, {"key": "33024679", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125585036829, "ground_truth": 0}, {"key": "37451334", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6279512341108753, "ground_truth": 0}, {"key": "37451334", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6150878769124688, "ground_truth": 0}, {"key": "37451334", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7866228179220855, "ground_truth": 0}, {"key": "37451334", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998537387944, "ground_truth": 0}, {"key": "37451334", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9039745087495622, "ground_truth": 0}, {"key": "33354824", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.45519860683383107, "ground_truth": 0}, {"key": "33354824", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5621764899315757, "ground_truth": 0}, {"key": "33354824", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3157359575328311, "ground_truth": 0}, {"key": "33354824", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3684056951993748, "ground_truth": 0}, {"key": "33354824", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3979384251278179, "ground_truth": 0}, {"key": "34688538", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6169358634371365, "ground_truth": 0}, {"key": "34688538", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6671476822086476, "ground_truth": 0}, {"key": "34688538", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5794004205237302, "ground_truth": 0}, {"key": "34688538", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4111108746327477, "ground_truth": 0}, {"key": "34688538", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.45713668885712744, "ground_truth": 0}, {"key": "33646276", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3793783940821568, "ground_truth": 0}, {"key": "33646276", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41111088951055524, "ground_truth": 0}, {"key": "33646276", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "33646276", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2766905298734179, "ground_truth": 0}, {"key": "33646276", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646151688731, "ground_truth": 0}, {"key": "40322608", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9394706097997608, "ground_truth": 0}, {"key": "40322608", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.907967131944416, "ground_truth": 0}, {"key": "40322608", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.91964254159832, "ground_truth": 0}, {"key": "40322608", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127686311474, "ground_truth": 0}, {"key": "40322608", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9353465102101102, "ground_truth": 0}, {"key": "39565762", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8233284032430549, "ground_truth": 0}, {"key": "39565762", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7853086078414327, "ground_truth": 0}, {"key": "39565762", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5583269758996446, "ground_truth": 0}, {"key": "39565762", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884514780721, "ground_truth": 0}, {"key": "39565762", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897340155318, "ground_truth": 0}, {"key": "30534259", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8519528167675656, "ground_truth": 0}, {"key": "30534259", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6959583223932158, "ground_truth": 0}, {"key": "30534259", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8140528006699606, "ground_truth": 0}, {"key": "30534259", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.668880276826999, "ground_truth": 0}, {"key": "30534259", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581672887937, "ground_truth": 0}, {"key": "39644242", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7577943661773592, "ground_truth": 0}, {"key": "39644242", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7772998747438403, "ground_truth": 0}, {"key": "39644242", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7704647951276524, "ground_truth": 0}, {"key": "39644242", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585576945684, "ground_truth": 0}, {"key": "39644242", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.744656361285025, "ground_truth": 0}, {"key": "19853740", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6654105730180602, "ground_truth": 0}, {"key": "19853740", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6206215945698265, "ground_truth": 0}, {"key": "19853740", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8519527833241217, "ground_truth": 0}, {"key": "19853740", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789247174382, "ground_truth": 0}, {"key": "19853740", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936520615447, "ground_truth": 0}, {"key": "33023078", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.857768103872801, "ground_truth": 0}, {"key": "33023078", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8783142396916499, "ground_truth": 0}, {"key": "33023078", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8679338489281204, "ground_truth": 0}, {"key": "33023078", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867854787673, "ground_truth": 0}, {"key": "33023078", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253930407675, "ground_truth": 0}, {"key": "38329806", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3208213077782051, "ground_truth": 0}, {"key": "38329806", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2628418587741592, "ground_truth": 0}, {"key": "38329806", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6636689703576527, "ground_truth": 0}, {"key": "38329806", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633106004803465, "ground_truth": 0}, {"key": "38329806", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408803432233, "ground_truth": 0}, {"key": "38761942", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4785288215949574, "ground_truth": 0}, {"key": "38761942", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6113819562141083, "ground_truth": 0}, {"key": "38761942", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4571367077128673, "ground_truth": 0}, {"key": "38761942", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4843800762066008, "ground_truth": 0}, {"key": "38761942", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33111973270671957, "ground_truth": 0}, {"key": "33773576", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7490872134971933, "ground_truth": 0}, {"key": "33773576", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7866228108789157, "ground_truth": 0}, {"key": "33773576", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7446563629488073, "ground_truth": 0}, {"key": "33773576", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460137150524184, "ground_truth": 0}, {"key": "33773576", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185944063920291, "ground_truth": 0}, {"key": "37642631", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7905303274434824, "ground_truth": 0}, {"key": "37642631", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7325918445020552, "ground_truth": 0}, {"key": "37642631", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6619228936569981, "ground_truth": 0}, {"key": "37642631", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241566643286, "ground_truth": 0}, {"key": "37642631", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701083782865, "ground_truth": 0}, {"key": "36609836", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7461390067783333, "ground_truth": 0}, {"key": "36609836", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7969253560554641, "ground_truth": 0}, {"key": "36609836", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9339146254760531, "ground_truth": 0}, {"key": "36609836", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575568617052, "ground_truth": 0}, {"key": "36609836", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099587630114, "ground_truth": 0}, {"key": "41035610", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548587923845, "ground_truth": 0}, {"key": "41035610", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6723317044317318, "ground_truth": 0}, {"key": "41035610", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7371581743757825, "ground_truth": 0}, {"key": "41035610", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943808856721, "ground_truth": 0}, {"key": "41035610", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365543382476, "ground_truth": 0}, {"key": "37592684", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5506073757946353, "ground_truth": 0}, {"key": "37592684", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7563575820505252, "ground_truth": 0}, {"key": "37592684", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8300437817951067, "ground_truth": 0}, {"key": "37592684", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357730104772, "ground_truth": 0}, {"key": "37592684", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916145787761, "ground_truth": 0}, {"key": "38951040", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6584174876568085, "ground_truth": 0}, {"key": "38951040", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.615087852514354, "ground_truth": 0}, {"key": "38951040", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6825737359593228, "ground_truth": 0}, {"key": "38951040", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.60766319345714, "ground_truth": 0}, {"key": "38951040", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476745825872, "ground_truth": 0}, {"key": "40774469", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.15713684566220518, "ground_truth": 0}, {"key": "40774469", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.11047114476358143, "ground_truth": 0}, {"key": "40774469", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.19072402168742686, "ground_truth": 0}, {"key": "40774469", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4882834047768371, "ground_truth": 0}, {"key": "40774469", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3345894543458364, "ground_truth": 0}, {"key": "40876288", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7279754387798755, "ground_truth": 0}, {"key": "40876288", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6774740003524831, "ground_truth": 0}, {"key": "40876288", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.646013707497195, "ground_truth": 0}, {"key": "40876288", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983122119326048, "ground_truth": 0}, {"key": "40876288", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011468592328, "ground_truth": 0}, {"key": "40340131", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5679366269002589, "ground_truth": 0}, {"key": "40340131", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7969253765915465, "ground_truth": 0}, {"key": "40340131", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6893056600945575, "ground_truth": 0}, {"key": "40340131", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197852678352, "ground_truth": 0}, {"key": "40340131", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743618981227, "ground_truth": 0}, {"key": "30121591", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6706082981140212, "ground_truth": 0}, {"key": "30121591", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7154240038096369, "ground_truth": 0}, {"key": "30121591", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.399811644399244, "ground_truth": 0}, {"key": "30121591", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366450424636, "ground_truth": 0}, {"key": "30121591", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646131410727, "ground_truth": 0}, {"key": "35623366", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8548846446590006, "ground_truth": 0}, {"key": "35623366", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41869692173835366, "ground_truth": 0}, {"key": "35623366", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8044059111200377, "ground_truth": 0}, {"key": "35623366", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632828100337, "ground_truth": 0}, {"key": "35623366", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837727561983, "ground_truth": 0}, {"key": "41014093", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6584174915080901, "ground_truth": 0}, {"key": "41014093", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5832033471516281, "ground_truth": 0}, {"key": "41014093", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7041601431057947, "ground_truth": 0}, {"key": "41014093", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.653126916193451, "ground_truth": 0}, {"key": "41014093", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.594551271280421, "ground_truth": 0}, {"key": "11387984", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8615382086593929, "ground_truth": 0}, {"key": "11387984", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7201714863831737, "ground_truth": 0}, {"key": "11387984", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7981867688148399, "ground_truth": 0}, {"key": "11387984", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424433619275, "ground_truth": 0}, {"key": "11387984", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430509673405, "ground_truth": 0}, {"key": "39508312", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4378235071407581, "ground_truth": 0}, {"key": "39508312", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6187804325730321, "ground_truth": 0}, {"key": "39508312", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6723316906135298, "ground_truth": 0}, {"key": "39508312", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512683089729, "ground_truth": 0}, {"key": "39508312", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.562176510522825, "ground_truth": 0}, {"key": "35815369", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4339814624164463, "ground_truth": 0}, {"key": "35815369", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4687906410099359, "ground_truth": 0}, {"key": "35815369", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5679366297019561, "ground_truth": 0}, {"key": "35815369", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358492856007, "ground_truth": 0}, {"key": "35815369", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175709070537009, "ground_truth": 0}, {"key": "35802823", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8128673151104239, "ground_truth": 0}, {"key": "35802823", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7431680128698683, "ground_truth": 0}, {"key": "35802823", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7310585748539388, "ground_truth": 0}, {"key": "35802823", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.43590153440445284, "ground_truth": 0}, {"key": "35802823", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892337116598763, "ground_truth": 0}, {"key": "38499968", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8300437694049247, "ground_truth": 0}, {"key": "38499968", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6774740093099647, "ground_truth": 0}, {"key": "38499968", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7279754511245929, "ground_truth": 0}, {"key": "38499968", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943709255245, "ground_truth": 0}, {"key": "38499968", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545618289444, "ground_truth": 0}, {"key": "36926726", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548463358891, "ground_truth": 0}, {"key": "36926726", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7918210545057804, "ground_truth": 0}, {"key": "36926726", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8438950963898342, "ground_truth": 0}, {"key": "36926726", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681003268989, "ground_truth": 0}, {"key": "36926726", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.767689859772828, "ground_truth": 0}, {"key": "40903712", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8044059073022921, "ground_truth": 0}, {"key": "40903712", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7892336888709991, "ground_truth": 0}, {"key": "40903712", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7918210721455792, "ground_truth": 0}, {"key": "40903712", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677635575631, "ground_truth": 0}, {"key": "40903712", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339634054105, "ground_truth": 0}, {"key": "19614862", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7057850412484424, "ground_truth": 0}, {"key": "19614862", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3276682784523373, "ground_truth": 0}, {"key": "19614862", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7008948452639462, "ground_truth": 0}, {"key": "19614862", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210650843993, "ground_truth": 0}, {"key": "19614862", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926665996778161, "ground_truth": 0}, {"key": "38861704", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4765796395050234, "ground_truth": 0}, {"key": "38861704", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4824291309394147, "ground_truth": 0}, {"key": "38861704", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4921881324957321, "ground_truth": 0}, {"key": "38861704", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324852743617, "ground_truth": 0}, {"key": "38861704", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224430745209, "ground_truth": 0}, {"key": "34349607", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.44360038491915854, "ground_truth": 0}, {"key": "34349607", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4941409022182374, "ground_truth": 0}, {"key": "34349607", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3208212747813884, "ground_truth": 0}, {"key": "34349607", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3504213606087975, "ground_truth": 0}, {"key": "34349607", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2704802144960288, "ground_truth": 0}, {"key": "20773800", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.09401018047232526, "ground_truth": 0}, {"key": "20773800", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.06705629172206744, "ground_truth": 0}, {"key": "20773800", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.05877655935319308, "ground_truth": 0}, {"key": "20773800", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.051845467507357225, "ground_truth": 0}, {"key": "20773800", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.11047114657704218, "ground_truth": 0}, {"key": "35545608", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6113819840728284, "ground_truth": 0}, {"key": "35545608", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.30569731892643004, "ground_truth": 0}, {"key": "35545608", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.39793842238298216, "ground_truth": 0}, {"key": "35545608", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891245973972, "ground_truth": 0}, {"key": "35545608", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4474602911811485, "ground_truth": 0}, {"key": "37258984", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548699741226, "ground_truth": 0}, {"key": "37258984", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5136684672777584, "ground_truth": 0}, {"key": "37258984", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5058591096860359, "ground_truth": 0}, {"key": "37258984", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708587981137, "ground_truth": 0}, {"key": "37258984", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318102269386, "ground_truth": 0}, {"key": "37274562", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6531269102164562, "ground_truth": 0}, {"key": "37274562", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7839884915410266, "ground_truth": 0}, {"key": "37274562", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8187367896310026, "ground_truth": 0}, {"key": "37274562", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215450187562, "ground_truth": 0}, {"key": "37274562", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424215505129, "ground_truth": 0}, {"key": "40828068", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9073122201956558, "ground_truth": 0}, {"key": "40828068", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8278281607116337, "ground_truth": 0}, {"key": "40828068", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8244619370103877, "ground_truth": 0}, {"key": "40828068", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681144149997, "ground_truth": 0}, {"key": "40828068", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159429920356, "ground_truth": 0}, {"key": "37807180", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6774739991884379, "ground_truth": 0}, {"key": "37807180", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8198933453821521, "ground_truth": 0}, {"key": "37807180", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8278281470936345, "ground_truth": 0}, {"key": "37807180", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.79818678454954, "ground_truth": 0}, {"key": "37807180", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423182407222, "ground_truth": 0}, {"key": "40748607", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9635062303347687, "ground_truth": 0}, {"key": "40748607", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.976129165942917, "ground_truth": 0}, {"key": "40748607", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9818752797424354, "ground_truth": 0}, {"key": "40748607", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9719924791093989, "ground_truth": 0}, {"key": "40748607", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9795114450796656, "ground_truth": 0}, {"key": "40123819", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9224823400871804, "ground_truth": 0}, {"key": "40123819", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.852935473963822, "ground_truth": 0}, {"key": "40123819", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8633916041538863, "ground_truth": 0}, {"key": "40123819", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.881614901567619, "ground_truth": 0}, {"key": "40123819", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145732973642, "ground_truth": 0}, {"key": "38453867", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8221891239912702, "ground_truth": 0}, {"key": "38453867", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5926665835206145, "ground_truth": 0}, {"key": "38453867", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5583269973336933, "ground_truth": 0}, {"key": "38453867", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163636778049, "ground_truth": 0}, {"key": "38453867", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512284656621, "ground_truth": 0}, {"key": "38944856", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.836554566285401, "ground_truth": 0}, {"key": "38944856", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8998277853978913, "ground_truth": 0}, {"key": "38944856", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7956580829298041, "ground_truth": 0}, {"key": "38944856", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9105453954569778, "ground_truth": 0}, {"key": "38944856", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175058449596, "ground_truth": 0}, {"key": "35778898", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8210441006618753, "ground_truth": 0}, {"key": "35778898", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8255897254974639, "ground_truth": 0}, {"key": "35778898", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.848972200323767, "ground_truth": 0}, {"key": "35778898", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070135769315, "ground_truth": 0}, {"key": "35778898", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.890294218804478, "ground_truth": 0}, {"key": "32530125", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.47852882809358477, "ground_truth": 0}, {"key": "32530125", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2974699429719936, "ground_truth": 0}, {"key": "32530125", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1993080102952409, "ground_truth": 0}, {"key": "32530125", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.43206337719021354, "ground_truth": 0}, {"key": "32530125", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953521275572594, "ground_truth": 0}, {"key": "35010363", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6076631392120267, "ground_truth": 0}, {"key": "35010363", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.25683198773161564, "ground_truth": 0}, {"key": "35010363", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6076631707400482, "ground_truth": 0}, {"key": "35010363", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723317278829664, "ground_truth": 0}, {"key": "35010363", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704727756776, "ground_truth": 0}, {"key": "27514800", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8697145808086324, "ground_truth": 0}, {"key": "27514800", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7662936451458272, "ground_truth": 0}, {"key": "27514800", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8714748585926219, "ground_truth": 0}, {"key": "27514800", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432060605411, "ground_truth": 0}, {"key": "27514800", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840468704192, "ground_truth": 0}, {"key": "25725840", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2598256431809312, "ground_truth": 0}, {"key": "25725840", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.14706451901078568, "ground_truth": 0}, {"key": "25725840", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2494472521124712, "ground_truth": 0}, {"key": "25725840", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.24944724432232712, "ground_truth": 0}, {"key": "25725840", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.18476749694266617, "ground_truth": 0}, {"key": "38327225", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.677474016090964, "ground_truth": 0}, {"key": "38327225", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.40168779905674545, "ground_truth": 0}, {"key": "38327225", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6442251002192113, "ground_truth": 0}, {"key": "38327225", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487600722799, "ground_truth": 0}, {"key": "38327225", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085948418159, "ground_truth": 0}, {"key": "11991724", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.846957834491674, "ground_truth": 0}, {"key": "11991724", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.743167986859434, "ground_truth": 0}, {"key": "11991724", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9441768592193233, "ground_truth": 0}, {"key": "11991724", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240814189606, "ground_truth": 0}, {"key": "11991724", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.867933852434637, "ground_truth": 0}, {"key": "32217545", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6548947265637427, "ground_truth": 0}, {"key": "32217545", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6774739955669895, "ground_truth": 0}, {"key": "32217545", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8365545603774517, "ground_truth": 0}, {"key": "32217545", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526433955418, "ground_truth": 0}, {"key": "32217545", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804156256972, "ground_truth": 0}, {"key": "12731847", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5851011327240634, "ground_truth": 0}, {"key": "12731847", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.49414088262719363, "ground_truth": 0}, {"key": "12731847", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.37754065838084355, "ground_truth": 0}, {"key": "12731847", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34158251286881985, "ground_truth": 0}, {"key": "12731847", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154240129463623, "ground_truth": 0}, {"key": "36827234", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7476159408939429, "ground_truth": 0}, {"key": "36827234", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5544704661246412, "ground_truth": 0}, {"key": "36827234", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7759445466791737, "ground_truth": 0}, {"key": "36827234", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802700133679, "ground_truth": 0}, {"key": "36827234", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068809059496, "ground_truth": 0}, {"key": "29111539", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6020615565628018, "ground_truth": 0}, {"key": "29111539", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8519527991872258, "ground_truth": 0}, {"key": "29111539", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8152324793993935, "ground_truth": 0}, {"key": "29111539", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754587788404, "ground_truth": 0}, {"key": "29111539", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303133666909, "ground_truth": 0}, {"key": "37763052", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6876299959142944, "ground_truth": 0}, {"key": "37763052", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7563575438275417, "ground_truth": 0}, {"key": "37763052", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8164063704618724, "ground_truth": 0}, {"key": "37763052", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354736171932, "ground_truth": 0}, {"key": "37763052", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365615250328, "ground_truth": 0}, {"key": "30682335", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4493926155042236, "ground_truth": 0}, {"key": "30682335", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6723317137205149, "ground_truth": 0}, {"key": "30682335", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3433417493237871, "ground_truth": 0}, {"key": "30682335", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.36296918369907166, "ground_truth": 0}, {"key": "30682335", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982315250639, "ground_truth": 0}, {"key": "12261276", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.044680871778411395, "ground_truth": 0}, {"key": "12261276", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.20181322269126284, "ground_truth": 0}, {"key": "12261276", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.11596071099163753, "ground_truth": 0}, {"key": "12261276", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.10743747507044399, "ground_truth": 0}, {"key": "12261276", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1208532375168424, "ground_truth": 0}, {"key": "36912979", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4186969202935455, "ground_truth": 0}, {"key": "36912979", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.39047584101926597, "ground_truth": 0}, {"key": "36912979", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.45519861817471025, "ground_truth": 0}, {"key": "36912979", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.550607369346371, "ground_truth": 0}, {"key": "36912979", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4301473305975839, "ground_truth": 0}, {"key": "30205259", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8152324822299191, "ground_truth": 0}, {"key": "30205259", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8068526215481789, "ground_truth": 0}, {"key": "30205259", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8289388201196034, "ground_truth": 0}, {"key": "30205259", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059116892583, "ground_truth": 0}, {"key": "30205259", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233284161049783, "ground_truth": 0}, {"key": "39458032", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9755769116490586, "ground_truth": 0}, {"key": "39458032", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9706877686063833, "ground_truth": 0}, {"key": "39458032", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9026096042269053, "ground_truth": 0}, {"key": "39458032", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437758516508, "ground_truth": 0}, {"key": "39458032", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9796676473295739, "ground_truth": 0}, {"key": "35116452", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2213506918802694, "ground_truth": 0}, {"key": "35116452", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3398275954763828, "ground_truth": 0}, {"key": "35116452", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.23370634779906518, "ground_truth": 0}, {"key": "35116452", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.1993080085704176, "ground_truth": 0}, {"key": "35116452", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.17441028001609488, "ground_truth": 0}, {"key": "40107476", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7866228164312681, "ground_truth": 0}, {"key": "40107476", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8577680959813052, "ground_truth": 0}, {"key": "40107476", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8449215430196881, "ground_truth": 0}, {"key": "40107476", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215154183048, "ground_truth": 0}, {"key": "40107476", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797459342824, "ground_truth": 0}, {"key": "39501049", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9445872055476491, "ground_truth": 0}, {"key": "39501049", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9626731133607054, "ground_truth": 0}, {"key": "39501049", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9445872032823114, "ground_truth": 0}, {"key": "39501049", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9385759580140286, "ground_truth": 0}, {"key": "39501049", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9294404026310312, "ground_truth": 0}, {"key": "39642178", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4649015818327793, "ground_truth": 0}, {"key": "39642178", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7505527416419027, "ground_truth": 0}, {"key": "39642178", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2628418331188132, "ground_truth": 0}, {"key": "39642178", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228684049053, "ground_truth": 0}, {"key": "39642178", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048022652368553, "ground_truth": 0}, {"key": "38024796", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.38676342639742417, "ground_truth": 0}, {"key": "38024796", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3007455670033547, "ground_truth": 0}, {"key": "38024796", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.21469142512561923, "ground_truth": 0}, {"key": "38024796", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4359014938829537, "ground_truth": 0}, {"key": "38024796", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.051845467314791664, "ground_truth": 0}, {"key": "36652079", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5370413850690333, "ground_truth": 0}, {"key": "36652079", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7879311964181257, "ground_truth": 0}, {"key": "36652079", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7041601315089415, "ground_truth": 0}, {"key": "36652079", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026579205294, "ground_truth": 0}, {"key": "36652079", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832092021488, "ground_truth": 0}, {"key": "32193402", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8864204044859362, "ground_truth": 0}, {"key": "32193402", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7295197715821521, "ground_truth": 0}, {"key": "32193402", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8933093988276398, "ground_truth": 0}, {"key": "32193402", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9246876875722811, "ground_truth": 0}, {"key": "32193402", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105463869053, "ground_truth": 0}, {"key": "32589706", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6740504664442751, "ground_truth": 0}, {"key": "32589706", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8080672073316129, "ground_truth": 0}, {"key": "32589706", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6842640174164416, "ground_truth": 0}, {"key": "32589706", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210799862018, "ground_truth": 0}, {"key": "32589706", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837570215728, "ground_truth": 0}, {"key": "38590589", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7122322079913126, "ground_truth": 0}, {"key": "38590589", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7446563618394688, "ground_truth": 0}, {"key": "38590589", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7217431930749318, "ground_truth": 0}, {"key": "38590589", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884398898096, "ground_truth": 0}, {"key": "38590589", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389960079436, "ground_truth": 0}, {"key": "37045414", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9822877008818894, "ground_truth": 0}, {"key": "37045414", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9912208912248737, "ground_truth": 0}, {"key": "37045414", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9835969674982874, "ground_truth": 0}, {"key": "37045414", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9884918507730858, "ground_truth": 0}, {"key": "37045414", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.982690905097747, "ground_truth": 0}, {"key": "33310095", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8548846404068107, "ground_truth": 0}, {"key": "33310095", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6584174926486709, "ground_truth": 0}, {"key": "33310095", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5640984847602829, "ground_truth": 0}, {"key": "33310095", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9572778046195722, "ground_truth": 0}, {"key": "33310095", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085816040003, "ground_truth": 0}, {"key": "37934604", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7879311947643353, "ground_truth": 0}, {"key": "37934604", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7476159351408209, "ground_truth": 0}, {"key": "37934604", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8633916217252646, "ground_truth": 0}, {"key": "37934604", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867693866999, "ground_truth": 0}, {"key": "37934604", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314700733522, "ground_truth": 0}, {"key": "39012181", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9874720665641998, "ground_truth": 0}, {"key": "39012181", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9828232902009353, "ground_truth": 0}, {"key": "39012181", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9912886161573826, "ground_truth": 0}, {"key": "39012181", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9886682452155452, "ground_truth": 0}, {"key": "39012181", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9932024677050321, "ground_truth": 0}, {"key": "40221674", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9802808722299737, "ground_truth": 0}, {"key": "40221674", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8940517171285584, "ground_truth": 0}, {"key": "40221674", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9771973644341972, "ground_truth": 0}, {"key": "40221674", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9556514204161496, "ground_truth": 0}, {"key": "40221674", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9651191128912324, "ground_truth": 0}, {"key": "36884862", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8289388169018816, "ground_truth": 0}, {"key": "36884862", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8848377794486648, "ground_truth": 0}, {"key": "36884862", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7786492958400376, "ground_truth": 0}, {"key": "36884862", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118690292737, "ground_truth": 0}, {"key": "36884862", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339767871842, "ground_truth": 0}, {"key": "39054429", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5175708663674772, "ground_truth": 0}, {"key": "39054429", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.54867351201656, "ground_truth": 0}, {"key": "39054429", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.30735801316849315, "ground_truth": 0}, {"key": "39054429", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3157359822746656, "ground_truth": 0}, {"key": "39054429", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.48047868645113234, "ground_truth": 0}, {"key": "36753964", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3720488018950758, "ground_truth": 0}, {"key": "36753964", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3923368350471498, "ground_truth": 0}, {"key": "36753964", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5945512492287224, "ground_truth": 0}, {"key": "36753964", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34334172761948045, "ground_truth": 0}, {"key": "36753964", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360040039309584, "ground_truth": 0}, {"key": "37612459", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5563995821688784, "ground_truth": 0}, {"key": "37612459", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6442250913609927, "ground_truth": 0}, {"key": "37612459", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6132365605894095, "ground_truth": 0}, {"key": "37612459", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011497614605, "ground_truth": 0}, {"key": "37612459", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583251879975, "ground_truth": 0}, {"key": "36805789", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8606036188405811, "ground_truth": 0}, {"key": "36805789", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8962513696518132, "ground_truth": 0}, {"key": "36805789", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8577681062765001, "ground_truth": 0}, {"key": "36805789", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.858718583545282, "ground_truth": 0}, {"key": "36805789", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804402936208, "ground_truth": 0}, {"key": "12757394", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6825737448482252, "ground_truth": 0}, {"key": "12757394", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5888891298611963, "ground_truth": 0}, {"key": "12757394", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6242935432782203, "ground_truth": 0}, {"key": "12757394", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102673840865, "ground_truth": 0}, {"key": "12757394", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117166126326742, "ground_truth": 0}, {"key": "32192542", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9066531207479861, "ground_truth": 0}, {"key": "32192542", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8933094006165776, "ground_truth": 0}, {"key": "32192542", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.919063291258921, "ground_truth": 0}, {"key": "32192542", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872045934100055, "ground_truth": 0}, {"key": "32192542", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9230391653667455, "ground_truth": 0}, {"key": "34856060", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6460137197024179, "ground_truth": 0}, {"key": "34856060", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3923368373840159, "ground_truth": 0}, {"key": "34856060", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6388352819649885, "ground_truth": 0}, {"key": "34856060", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784146518242, "ground_truth": 0}, {"key": "34856060", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990601687371, "ground_truth": 0}, {"key": "36083416", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8766343688652208, "ground_truth": 0}, {"key": "36083416", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.819893342866653, "ground_truth": 0}, {"key": "36083416", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8688267774350333, "ground_truth": 0}, {"key": "36083416", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240927181916, "ground_truth": 0}, {"key": "36083416", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.891811040036772, "ground_truth": 0}, {"key": "33839050", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.44746025770233916, "ground_truth": 0}, {"key": "33839050", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.43014737160236494, "ground_truth": 0}, {"key": "33839050", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.29259529873931556, "ground_truth": 0}, {"key": "33839050", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3345894643474256, "ground_truth": 0}, {"key": "33839050", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641425362239, "ground_truth": 0}, {"key": "18464690", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.640635859808875, "ground_truth": 0}, {"key": "18464690", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6859494585796518, "ground_truth": 0}, {"key": "18464690", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.656658264353107, "ground_truth": 0}, {"key": "18464690", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4455295178781439, "ground_truth": 0}, {"key": "18464690", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370414086149915, "ground_truth": 0}, {"key": "39212665", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.1259227767534645, "ground_truth": 0}, {"key": "39212665", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1530421552189817, "ground_truth": 0}, {"key": "39212665", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.13753247209973352, "ground_truth": 0}, {"key": "39212665", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2056150476422904, "ground_truth": 0}, {"key": "39212665", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.15610490002098887, "ground_truth": 0}, {"key": "40094011", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.644225109572327, "ground_truth": 0}, {"key": "40094011", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7217432066588709, "ground_truth": 0}, {"key": "40094011", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.781330615974996, "ground_truth": 0}, {"key": "40094011", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916100576375, "ground_truth": 0}, {"key": "40094011", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982216823854, "ground_truth": 0}, {"key": "36036272", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6206216344619488, "ground_truth": 0}, {"key": "36036272", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6654105525267695, "ground_truth": 0}, {"key": "36036272", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5602526558835176, "ground_truth": 0}, {"key": "36036272", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791787157572866, "ground_truth": 0}, {"key": "36036272", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094716820697, "ground_truth": 0}, {"key": "30681904", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6566582544278974, "ground_truth": 0}, {"key": "30681904", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.47657965235648625, "ground_truth": 0}, {"key": "30681904", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5312093651369647, "ground_truth": 0}, {"key": "30681904", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117166106830741, "ground_truth": 0}, {"key": "30681904", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397007221478, "ground_truth": 0}, {"key": "27834240", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.12336561898864767, "ground_truth": 0}, {"key": "27834240", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.26133091003713316, "ground_truth": 0}, {"key": "27834240", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.21469140775190929, "ground_truth": 0}, {"key": "27834240", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.17217185209526936, "ground_truth": 0}, {"key": "27834240", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.18359363185316388, "ground_truth": 0}, {"key": "35025075", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3276682977726258, "ground_truth": 0}, {"key": "35025075", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6808786034131994, "ground_truth": 0}, {"key": "35025075", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5888891243809782, "ground_truth": 0}, {"key": "35025075", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593179630773, "ground_truth": 0}, {"key": "35025075", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4244119967861273, "ground_truth": 0}, {"key": "33316985", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8732148396071405, "ground_truth": 0}, {"key": "33316985", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7676898568171744, "ground_truth": 0}, {"key": "33316985", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7386690932681472, "ground_truth": 0}, {"key": "33316985", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118656757739, "ground_truth": 0}, {"key": "33316985", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525396844249396, "ground_truth": 0}, {"key": "17037056", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.28937169279721664, "ground_truth": 0}, {"key": "17037056", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3056973233411659, "ground_truth": 0}, {"key": "17037056", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.47657966549240677, "ground_truth": 0}, {"key": "17037056", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3276683043824901, "ground_truth": 0}, {"key": "17037056", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.32252600227185846, "ground_truth": 0}, {"key": "34050457", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7325918284722338, "ground_truth": 0}, {"key": "34050457", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7233094610886495, "ground_truth": 0}, {"key": "34050457", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8104788881047057, "ground_truth": 0}, {"key": "34050457", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026788285819, "ground_truth": 0}, {"key": "34050457", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673240981893, "ground_truth": 0}, {"key": "34713745", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4785288099362289, "ground_truth": 0}, {"key": "34713745", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5253688093879865, "ground_truth": 0}, {"key": "34713745", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4785288416111176, "ground_truth": 0}, {"key": "34713745", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33982759525474787, "ground_truth": 0}, {"key": "34713745", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.353986296437335, "ground_truth": 0}, {"key": "40856210", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.10087861920884605, "ground_truth": 0}, {"key": "40856210", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.17441027115009425, "ground_truth": 0}, {"key": "40856210", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.14804718662928187, "ground_truth": 0}, {"key": "40856210", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.1732882113085645, "ground_truth": 0}, {"key": "40856210", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.09947021543727351, "ground_truth": 0}, {"key": "40848302", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7549149948459556, "ground_truth": 0}, {"key": "40848302", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8104789266324952, "ground_truth": 0}, {"key": "40848302", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7201715061587118, "ground_truth": 0}, {"key": "40848302", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647810467284, "ground_truth": 0}, {"key": "40848302", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527565185783, "ground_truth": 0}, {"key": "40636168", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2974699388843412, "ground_truth": 0}, {"key": "40636168", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5389832195113489, "ground_truth": 0}, {"key": "40636168", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.36658970079831515, "ground_truth": 0}, {"key": "40636168", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964546917563, "ground_truth": 0}, {"key": "40636168", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3775406772150679, "ground_truth": 0}, {"key": "34423311", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6671476958050597, "ground_truth": 0}, {"key": "34423311", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3174262555536325, "ground_truth": 0}, {"key": "34423311", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.723309479945793, "ground_truth": 0}, {"key": "34423311", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990499452084, "ground_truth": 0}, {"key": "34423311", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061757218204, "ground_truth": 0}, {"key": "34833945", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9278877976579761, "ground_truth": 0}, {"key": "34833945", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9585377324059542, "ground_truth": 0}, {"key": "34833945", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9449947162040094, "ground_truth": 0}, {"key": "34833945", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9852713861548434, "ground_truth": 0}, {"key": "34833945", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9429286016198022, "ground_truth": 0}, {"key": "21272328", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.1384617955832434, "ground_truth": 0}, {"key": "21272328", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6297746136919363, "ground_truth": 0}, {"key": "21272328", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5234203190369268, "ground_truth": 0}, {"key": "21272328", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3433417447916121, "ground_truth": 0}, {"key": "21272328", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2628418243971535, "ground_truth": 0}, {"key": "38648957", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4225046487581761, "ground_truth": 0}, {"key": "38648957", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.21206881268416924, "ground_truth": 0}, {"key": "38648957", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4687906227506477, "ground_truth": 0}, {"key": "38648957", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510837861587225, "ground_truth": 0}, {"key": "38648957", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850224108645, "ground_truth": 0}, {"key": "24942981", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2704802001932201, "ground_truth": 0}, {"key": "24942981", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.12168574677825363, "ground_truth": 0}, {"key": "24942981", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.38306414145080186, "ground_truth": 0}, {"key": "24942981", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.1431877146391919, "ground_truth": 0}, {"key": "24942981", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.16451645852698724, "ground_truth": 0}, {"key": "35882366", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2186693671932842, "ground_truth": 0}, {"key": "35882366", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.757794370970517, "ground_truth": 0}, {"key": "35882366", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.13477592294209848, "ground_truth": 0}, {"key": "35882366", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.379378372404039, "ground_truth": 0}, {"key": "35882366", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.276690535606797, "ground_truth": 0}, {"key": "40559523", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7201715092653345, "ground_truth": 0}, {"key": "40559523", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7264256191582054, "ground_truth": 0}, {"key": "40559523", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7704647926504756, "ground_truth": 0}, {"key": "40559523", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419742743521, "ground_truth": 0}, {"key": "40559523", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849617279315, "ground_truth": 0}, {"key": "24632722", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5983121937512786, "ground_truth": 0}, {"key": "24632722", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.30239106515182007, "ground_truth": 0}, {"key": "24632722", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3629692182296653, "ground_truth": 0}, {"key": "24632722", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512522912909, "ground_truth": 0}, {"key": "24632722", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759749656397, "ground_truth": 0}, {"key": "36002759", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4282333868577445, "ground_truth": 0}, {"key": "36002759", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4668455825000708, "ground_truth": 0}, {"key": "36002759", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6334102579391633, "ground_truth": 0}, {"key": "36002759", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.31069440605791854, "ground_truth": 0}, {"key": "36002759", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583270035867264, "ground_truth": 0}, {"key": "29508534", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8210441025134269, "ground_truth": 0}, {"key": "29508534", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6808786348102928, "ground_truth": 0}, {"key": "29508534", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.754914980963501, "ground_truth": 0}, {"key": "29508534", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754572953877, "ground_truth": 0}, {"key": "29508534", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.49804689080825465, "ground_truth": 0}, {"key": "15631612", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8984105532675737, "ground_truth": 0}, {"key": "15631612", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8529354901861047, "ground_truth": 0}, {"key": "15631612", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8438950928686312, "ground_truth": 0}, {"key": "15631612", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281484504858, "ground_truth": 0}, {"key": "15631612", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748642857616, "ground_truth": 0}, {"key": "40731892", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.1623800390268423, "ground_truth": 0}, {"key": "40731892", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.21866939063795465, "ground_truth": 0}, {"key": "40731892", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.19806417856093547, "ground_truth": 0}, {"key": "40731892", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3140505138012127, "ground_truth": 0}, {"key": "40731892", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2598256402555947, "ground_truth": 0}, {"key": "35971910", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.880797072132246, "ground_truth": 0}, {"key": "35971910", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9339146179716614, "ground_truth": 0}, {"key": "35971910", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8376199641659243, "ground_truth": 0}, {"key": "35971910", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9190632984010978, "ground_truth": 0}, {"key": "35971910", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152325032483925, "ground_truth": 0}, {"key": "34428424", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9441768540299783, "ground_truth": 0}, {"key": "34428424", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9686195710572115, "ground_truth": 0}, {"key": "34428424", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9807288616830114, "ground_truth": 0}, {"key": "34428424", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9732407191533035, "ground_truth": 0}, {"key": "34428424", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.981021961311223, "ground_truth": 0}, {"key": "36971005", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9532750439371392, "ground_truth": 0}, {"key": "36971005", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9196425341865473, "ground_truth": 0}, {"key": "36971005", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8856314687437625, "ground_truth": 0}, {"key": "36971005", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583410973672, "ground_truth": 0}, {"key": "36971005", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767895204707, "ground_truth": 0}, {"key": "34649067", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2942150026216722, "ground_truth": 0}, {"key": "34649067", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3345894173155974, "ground_truth": 0}, {"key": "34649067", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.23091975983305726, "ground_truth": 0}, {"key": "34649067", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.24220563729007286, "ground_truth": 0}, {"key": "34649067", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.20817894172851908, "ground_truth": 0}, {"key": "37355154", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.12852513349137715, "ground_truth": 0}, {"key": "37355154", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.31742625068152563, "ground_truth": 0}, {"key": "37355154", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.26435836963096637, "ground_truth": 0}, {"key": "37355154", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2658804872481113, "ground_truth": 0}, {"key": "37355154", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2735743651921319, "ground_truth": 0}, {"key": "38674697", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.47852884472718576, "ground_truth": 0}, {"key": "38674697", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.25683197717227885, "ground_truth": 0}, {"key": "38674697", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4843800585968538, "ground_truth": 0}, {"key": "38674697", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.32766828973050727, "ground_truth": 0}, {"key": "38674697", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359015416511406, "ground_truth": 0}, {"key": "40525767", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9908743621364018, "ground_truth": 0}, {"key": "40525767", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9954967274197783, "ground_truth": 0}, {"key": "40525767", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.98840263871139, "ground_truth": 0}, {"key": "40525767", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9916195460660825, "ground_truth": 0}, {"key": "40525767", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9859363727012277, "ground_truth": 0}, {"key": "27165110", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.14608724613776844, "ground_truth": 0}, {"key": "27165110", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.24077460874392123, "ground_truth": 0}, {"key": "27165110", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.13296424315393143, "ground_truth": 0}, {"key": "27165110", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3106943826403968, "ground_truth": 0}, {"key": "27165110", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1143685210116158, "ground_truth": 0}, {"key": "35497491", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7577943610505833, "ground_truth": 0}, {"key": "35497491", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6601723780829867, "ground_truth": 0}, {"key": "35497491", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6169358435464404, "ground_truth": 0}, {"key": "35497491", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947431514207, "ground_truth": 0}, {"key": "35497491", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.785308588309738, "ground_truth": 0}, {"key": "40690716", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7799929046485764, "ground_truth": 0}, {"key": "40690716", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9026096077570789, "ground_truth": 0}, {"key": "40690716", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9230391668419635, "ground_truth": 0}, {"key": "40690716", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9118099584669234, "ground_truth": 0}, {"key": "40690716", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418248632147, "ground_truth": 0}, {"key": "34835193", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9618217225654686, "ground_truth": 0}, {"key": "34835193", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9810219643183743, "ground_truth": 0}, {"key": "34835193", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9764905460717795, "ground_truth": 0}, {"key": "34835193", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9793540704314947, "ground_truth": 0}, {"key": "34835193", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9868787283848421, "ground_truth": 0}, {"key": "39471712", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5851011495544431, "ground_truth": 0}, {"key": "39471712", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5679366225494134, "ground_truth": 0}, {"key": "39471712", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.544801404304801, "ground_truth": 0}, {"key": "39471712", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646130142991, "ground_truth": 0}, {"key": "39471712", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256154136828, "ground_truth": 0}, {"key": "39115192", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.844921526974137, "ground_truth": 0}, {"key": "39115192", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7549149798715401, "ground_truth": 0}, {"key": "39115192", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7201715165224245, "ground_truth": 0}, {"key": "39115192", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4687906300122574, "ground_truth": 0}, {"key": "39115192", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213111526213, "ground_truth": 0}, {"key": "23520673", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.32939171265068296, "ground_truth": 0}, {"key": "23520673", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.38676344262328116, "ground_truth": 0}, {"key": "23520673", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.36477754369917076, "ground_truth": 0}, {"key": "23520673", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279511900068717, "ground_truth": 0}, {"key": "23520673", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.37204877000007885, "ground_truth": 0}, {"key": "35764233", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7592254295914067, "ground_truth": 0}, {"key": "35764233", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.49414088296008013, "ground_truth": 0}, {"key": "35764233", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4054487440091543, "ground_truth": 0}, {"key": "35764233", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.345105262257252, "ground_truth": 0}, {"key": "35764233", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2186693839371341, "ground_truth": 0}, {"key": "35228910", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.315735981679199, "ground_truth": 0}, {"key": "35228910", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37570645166584904, "ground_truth": 0}, {"key": "35228910", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2782567844818269, "ground_truth": 0}, {"key": "35228910", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687307200236756, "ground_truth": 0}, {"key": "35228910", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.17781087372910304, "ground_truth": 0}, {"key": "36795599", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9219218324364317, "ground_truth": 0}, {"key": "36795599", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9142907150311659, "ground_truth": 0}, {"key": "36795599", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9268352750569787, "ground_truth": 0}, {"key": "36795599", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.942081909578198, "ground_truth": 0}, {"key": "36795599", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907175424297, "ground_truth": 0}, {"key": "38641949", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7956580999755797, "ground_truth": 0}, {"key": "38641949", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8519528015963793, "ground_truth": 0}, {"key": "38641949", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6992544159187484, "ground_truth": 0}, {"key": "38641949", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943891173244, "ground_truth": 0}, {"key": "38641949", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423231655848, "ground_truth": 0}, {"key": "29968443", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9111797176061761, "ground_truth": 0}, {"key": "29968443", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.927887787277533, "ground_truth": 0}, {"key": "29968443", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9683812315007648, "ground_truth": 0}, {"key": "29968443", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110389983926, "ground_truth": 0}, {"key": "29968443", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9358173610908244, "ground_truth": 0}, {"key": "21268042", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.48633154459007594, "ground_truth": 0}, {"key": "21268042", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8031737881149124, "ground_truth": 0}, {"key": "21268042", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7371581579713736, "ground_truth": 0}, {"key": "21268042", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366578991368, "ground_truth": 0}, {"key": "21268042", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754658639594, "ground_truth": 0}, {"key": "26808572", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.675764580169975, "ground_truth": 0}, {"key": "26808572", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4263216133565149, "ground_truth": 0}, {"key": "26808572", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6688802677637407, "ground_truth": 0}, {"key": "26808572", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837516329681, "ground_truth": 0}, {"key": "26808572", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068889643272, "ground_truth": 0}, {"key": "37829390", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7356416047152111, "ground_truth": 0}, {"key": "37829390", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8244619252202064, "ground_truth": 0}, {"key": "37829390", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9046505325981173, "ground_truth": 0}, {"key": "37829390", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267836487938, "ground_truth": 0}, {"key": "37829390", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802270467436, "ground_truth": 0}, {"key": "35716045", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8469578589996584, "ground_truth": 0}, {"key": "35716045", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8947894705289663, "ground_truth": 0}, {"key": "35716045", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8539127435464041, "ground_truth": 0}, {"key": "35716045", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195272547484, "ground_truth": 0}, {"key": "35716045", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297879585074, "ground_truth": 0}, {"key": "34367070", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8428631559673999, "ground_truth": 0}, {"key": "34367070", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9039745124594638, "ground_truth": 0}, {"key": "34367070", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8615381993378388, "ground_truth": 0}, {"key": "34367070", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509646986304553, "ground_truth": 0}, {"key": "34367070", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.787931197034813, "ground_truth": 0}, {"key": "35239748", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7490872266355988, "ground_truth": 0}, {"key": "35239748", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6671476517454116, "ground_truth": 0}, {"key": "35239748", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43206339616228395, "ground_truth": 0}, {"key": "35239748", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056066535662, "ground_truth": 0}, {"key": "35239748", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283843551638, "ground_truth": 0}, {"key": "40421370", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6992544166102017, "ground_truth": 0}, {"key": "40421370", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5794003863762176, "ground_truth": 0}, {"key": "40421370", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4785288480219765, "ground_truth": 0}, {"key": "40421370", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269988854156, "ground_truth": 0}, {"key": "40421370", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4167966518290371, "ground_truth": 0}, {"key": "37288396", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8175744802244294, "ground_truth": 0}, {"key": "37288396", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4244119639228986, "ground_truth": 0}, {"key": "37288396", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7170119084774074, "ground_truth": 0}, {"key": "37288396", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575609685237, "ground_truth": 0}, {"key": "37288396", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059725608318, "ground_truth": 0}, {"key": "38903688", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8732148289997135, "ground_truth": 0}, {"key": "38903688", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9420819118146476, "ground_truth": 0}, {"key": "38903688", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8824278634684165, "ground_truth": 0}, {"key": "38903688", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9246876899371056, "ground_truth": 0}, {"key": "38903688", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578399213028, "ground_truth": 0}, {"key": "28071228", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8499711854853277, "ground_truth": 0}, {"key": "28071228", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9458012684453212, "ground_truth": 0}, {"key": "28071228", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8568122846164984, "ground_truth": 0}, {"key": "28071228", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9118099510886807, "ground_truth": 0}, {"key": "28071228", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117932290443, "ground_truth": 0}, {"key": "36855834", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.42059960397067553, "ground_truth": 0}, {"key": "36855834", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5640984685928492, "ground_truth": 0}, {"key": "36855834", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.35042139305638026, "ground_truth": 0}, {"key": "36855834", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064574056117, "ground_truth": 0}, {"key": "36855834", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.284576012061048, "ground_truth": 0}, {"key": "40548717", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4980468777437546, "ground_truth": 0}, {"key": "40548717", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5078118687529671, "ground_truth": 0}, {"key": "40548717", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4263215875133868, "ground_truth": 0}, {"key": "40548717", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582585114935, "ground_truth": 0}, {"key": "40548717", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4073334065887696, "ground_truth": 0}, {"key": "37051175", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7416740078171156, "ground_truth": 0}, {"key": "37051175", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7690802327861745, "ground_truth": 0}, {"key": "37051175", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5253688585587241, "ground_truth": 0}, {"key": "37051175", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585894198173, "ground_truth": 0}, {"key": "37051175", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.860603625629994, "ground_truth": 0}, {"key": "38882119", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.76489161624821, "ground_truth": 0}, {"key": "38882119", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6315942945020756, "ground_truth": 0}, {"key": "38882119", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7170118734428531, "ground_truth": 0}, {"key": "38882119", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819550003731, "ground_truth": 0}, {"key": "38882119", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723701099872, "ground_truth": 0}, {"key": "19485402", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7356416421565565, "ground_truth": 0}, {"key": "19485402", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6315942982786165, "ground_truth": 0}, {"key": "19485402", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.861538212255825, "ground_truth": 0}, {"key": "19485402", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251222750285, "ground_truth": 0}, {"key": "19485402", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512065253446, "ground_truth": 0}, {"key": "36060907", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6876300049129574, "ground_truth": 0}, {"key": "36060907", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5698526490892952, "ground_truth": 0}, {"key": "36060907", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7356416516572537, "ground_truth": 0}, {"key": "36060907", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746010513537, "ground_truth": 0}, {"key": "36060907", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878564086524, "ground_truth": 0}, {"key": "24037309", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5774953681269339, "ground_truth": 0}, {"key": "24037309", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7325918128457858, "ground_truth": 0}, {"key": "24037309", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8449215315211566, "ground_truth": 0}, {"key": "24037309", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.924141824385482, "ground_truth": 0}, {"key": "24037309", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740303126681, "ground_truth": 0}, {"key": "35605805", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6909762885174224, "ground_truth": 0}, {"key": "35605805", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7431680285552944, "ground_truth": 0}, {"key": "35605805", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6388352599911499, "ground_truth": 0}, {"key": "35605805", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.717011880845279, "ground_truth": 0}, {"key": "35605805", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307400455881, "ground_truth": 0}, {"key": "17706248", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4980468862014369, "ground_truth": 0}, {"key": "17706248", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.34334176099933805, "ground_truth": 0}, {"key": "17706248", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.30902371960555564, "ground_truth": 0}, {"key": "17706248", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185028216782, "ground_truth": 0}, {"key": "17706248", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360039783638516, "ground_truth": 0}, {"key": "36883559", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5964331431635103, "ground_truth": 0}, {"key": "36883559", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5640984928334067, "ground_truth": 0}, {"key": "36883559", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7634837742970029, "ground_truth": 0}, {"key": "36883559", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476705194876, "ground_truth": 0}, {"key": "36883559", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.642432487830919, "ground_truth": 0}, {"key": "32799471", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8031738009528231, "ground_truth": 0}, {"key": "32799471", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7866228034420473, "ground_truth": 0}, {"key": "32799471", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7866228182601328, "ground_truth": 0}, {"key": "32799471", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578501496162, "ground_truth": 0}, {"key": "32799471", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283129614636, "ground_truth": 0}, {"key": "34797243", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4649015907933149, "ground_truth": 0}, {"key": "34797243", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37570645299120387, "ground_truth": 0}, {"key": "34797243", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.670608264945807, "ground_truth": 0}, {"key": "34797243", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.25386100799202715, "ground_truth": 0}, {"key": "34797243", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4590760992408574, "ground_truth": 0}, {"key": "32154876", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.47657968775872434, "ground_truth": 0}, {"key": "32154876", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2893716984208949, "ground_truth": 0}, {"key": "32154876", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3702253755615191, "ground_truth": 0}, {"key": "32154876", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.26740816149727875, "ground_truth": 0}, {"key": "32154876", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048022555384643, "ground_truth": 0}, {"key": "37962274", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7905303190719165, "ground_truth": 0}, {"key": "37962274", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7759445677759718, "ground_truth": 0}, {"key": "37962274", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5156199366358128, "ground_truth": 0}, {"key": "37962274", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.710628305146996, "ground_truth": 0}, {"key": "37962274", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956581000696025, "ground_truth": 0}, {"key": "35574030", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6842640263021104, "ground_truth": 0}, {"key": "35574030", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6791787103611084, "ground_truth": 0}, {"key": "35574030", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9111797036541937, "ground_truth": 0}, {"key": "35574030", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026758225999, "ground_truth": 0}, {"key": "35574030", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195250878382, "ground_truth": 0}, {"key": "39105949", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.65489472294661, "ground_truth": 0}, {"key": "39105949", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7154239974908168, "ground_truth": 0}, {"key": "39105949", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6169358334368921, "ground_truth": 0}, {"key": "39105949", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.702530049587102, "ground_truth": 0}, {"key": "39105949", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715181172171, "ground_truth": 0}, {"key": "41064322", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9536217952292726, "ground_truth": 0}, {"key": "41064322", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9569571482975046, "ground_truth": 0}, {"key": "41064322", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9492946355099618, "ground_truth": 0}, {"key": "41064322", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.960361158328655, "ground_truth": 0}, {"key": "41064322", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.946596667506933, "ground_truth": 0}, {"key": "28105101", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8376199764016246, "ground_truth": 0}, {"key": "28105101", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8031737979512585, "ground_truth": 0}, {"key": "28105101", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7577943738994728, "ground_truth": 0}, {"key": "28105101", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142463099599, "ground_truth": 0}, {"key": "28105101", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.841825648188134, "ground_truth": 0}, {"key": "36036068", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6584174829423254, "ground_truth": 0}, {"key": "36036068", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4551986001430704, "ground_truth": 0}, {"key": "36036068", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6976089105238725, "ground_truth": 0}, {"key": "36036068", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026736065226, "ground_truth": 0}, {"key": "36036068", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786387150002, "ground_truth": 0}, {"key": "37991460", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8438950922344419, "ground_truth": 0}, {"key": "37991460", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8175744620281853, "ground_truth": 0}, {"key": "37991460", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5253688416820289, "ground_truth": 0}, {"key": "37991460", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673104045759, "ground_truth": 0}, {"key": "37991460", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228623747546, "ground_truth": 0}, {"key": "38437830", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6460137225235364, "ground_truth": 0}, {"key": "38437830", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.638835312760184, "ground_truth": 0}, {"key": "38437830", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8104789124032455, "ground_truth": 0}, {"key": "38437830", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797601621081, "ground_truth": 0}, {"key": "38437830", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744766292079, "ground_truth": 0}, {"key": "36507138", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6548947504107925, "ground_truth": 0}, {"key": "36507138", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "36507138", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.40168779877480554, "ground_truth": 0}, {"key": "36507138", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711537567176, "ground_truth": 0}, {"key": "36507138", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804786724868448, "ground_truth": 0}, {"key": "37824866", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8278281525008877, "ground_truth": 0}, {"key": "37824866", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9039745050720029, "ground_truth": 0}, {"key": "37824866", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7799928995010142, "ground_truth": 0}, {"key": "37824866", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493190810624, "ground_truth": 0}, {"key": "37824866", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121928797874, "ground_truth": 0}, {"key": "25088134", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5058591122622356, "ground_truth": 0}, {"key": "25088134", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6619228991638854, "ground_truth": 0}, {"key": "25088134", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5331544093571824, "ground_truth": 0}, {"key": "25088134", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47268346463819705, "ground_truth": 0}, {"key": "25088134", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.527316539458014, "ground_truth": 0}, {"key": "40172531", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7648916307972047, "ground_truth": 0}, {"key": "40172531", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.814052807834685, "ground_truth": 0}, {"key": "40172531", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7057850453663984, "ground_truth": 0}, {"key": "40172531", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438951049189547, "ground_truth": 0}, {"key": "40172531", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575424925969, "ground_truth": 0}, {"key": "37035874", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.372048789492272, "ground_truth": 0}, {"key": "37035874", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4436004468736966, "ground_truth": 0}, {"key": "37035874", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.29583983464628194, "ground_truth": 0}, {"key": "37035874", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054486991851965, "ground_truth": 0}, {"key": "37035874", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2958398714819721, "ground_truth": 0}, {"key": "36404465", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9801292875982437, "ground_truth": 0}, {"key": "36404465", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9845754475214801, "ground_truth": 0}, {"key": "36404465", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9695556519872902, "ground_truth": 0}, {"key": "36404465", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9559813496278594, "ground_truth": 0}, {"key": "36404465", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9693241977650935, "ground_truth": 0}, {"key": "39602052", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7295197755400593, "ground_truth": 0}, {"key": "39602052", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8933094018302887, "ground_truth": 0}, {"key": "39602052", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.884837771134621, "ground_truth": 0}, {"key": "39602052", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325056028468, "ground_truth": 0}, {"key": "39602052", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8925625273279436, "ground_truth": 0}, {"key": "33792789", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6909762892412673, "ground_truth": 0}, {"key": "33792789", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5717665752299862, "ground_truth": 0}, {"key": "33792789", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.771843513851638, "ground_truth": 0}, {"key": "33792789", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228419104283, "ground_truth": 0}, {"key": "33792789", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956581035257497, "ground_truth": 0}, {"key": "32776626", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7718434948251817, "ground_truth": 0}, {"key": "32776626", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7505527649508632, "ground_truth": 0}, {"key": "32776626", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.546738145650911, "ground_truth": 0}, {"key": "32776626", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723968460054, "ground_truth": 0}, {"key": "32776626", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935396332956, "ground_truth": 0}, {"key": "37195090", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5253688143048857, "ground_truth": 0}, {"key": "37195090", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5370413963604981, "ground_truth": 0}, {"key": "37195090", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5563995731241127, "ground_truth": 0}, {"key": "37195090", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4610167882588243, "ground_truth": 0}, {"key": "37195090", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011785727603, "ground_truth": 0}, {"key": "33981824", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.22405545103835026, "ground_truth": 0}, {"key": "33981824", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3276683012188554, "ground_truth": 0}, {"key": "33981824", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.18126321236076312, "ground_truth": 0}, {"key": "33981824", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.16559311529062154, "ground_truth": 0}, {"key": "33981824", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.20307462618144198, "ground_truth": 0}, {"key": "39569142", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.20817894344699633, "ground_truth": 0}, {"key": "39569142", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.40922077934321965, "ground_truth": 0}, {"key": "39569142", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3575675147234204, "ground_truth": 0}, {"key": "39569142", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2628418351498749, "ground_truth": 0}, {"key": "39569142", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974735626656886, "ground_truth": 0}, {"key": "40268210", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8289388226432558, "ground_truth": 0}, {"key": "40268210", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5660185329676738, "ground_truth": 0}, {"key": "40268210", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8006920076183959, "ground_truth": 0}, {"key": "40268210", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122960976605, "ground_truth": 0}, {"key": "40268210", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619346344123, "ground_truth": 0}, {"key": "34925159", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8198933207548531, "ground_truth": 0}, {"key": "34925159", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5983121961138885, "ground_truth": 0}, {"key": "34925159", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8289388062315073, "ground_truth": 0}, {"key": "34925159", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314721106712, "ground_truth": 0}, {"key": "34925159", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9105453837198362, "ground_truth": 0}, {"key": "36181903", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9609517039349191, "ground_truth": 0}, {"key": "36181903", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9005297902156807, "ground_truth": 0}, {"key": "36181903", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.939470604955432, "ground_truth": 0}, {"key": "36181903", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9329437153814236, "ground_truth": 0}, {"key": "36181903", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9666631771242796, "ground_truth": 0}, {"key": "38620559", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9230391590097818, "ground_truth": 0}, {"key": "38620559", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9334308185861525, "ground_truth": 0}, {"key": "38620559", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8940517111772295, "ground_truth": 0}, {"key": "38620559", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9289263292302329, "ground_truth": 0}, {"key": "38620559", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505382811344, "ground_truth": 0}, {"key": "32719657", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3398276183959436, "ground_truth": 0}, {"key": "32719657", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.803173783799176, "ground_truth": 0}, {"key": "32719657", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.39047582363684097, "ground_truth": 0}, {"key": "32719657", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47852882639920924, "ground_truth": 0}, {"key": "32719657", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238640083035, "ground_truth": 0}, {"key": "37530914", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4804786918636298, "ground_truth": 0}, {"key": "37530914", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.38676345833711945, "ground_truth": 0}, {"key": "37530914", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.40922078240947973, "ground_truth": 0}, {"key": "37530914", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197805118607, "ground_truth": 0}, {"key": "37530914", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.312369990592074, "ground_truth": 0}, {"key": "33306933", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8643104582738101, "ground_truth": 0}, {"key": "33306933", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9362850037789721, "ground_truth": 0}, {"key": "33306933", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.957596170275529, "ground_truth": 0}, {"key": "33306933", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916177945058, "ground_truth": 0}, {"key": "33306933", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9202179851679101, "ground_truth": 0}, {"key": "33837212", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7772998703431252, "ground_truth": 0}, {"key": "33837212", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6601723630015608, "ground_truth": 0}, {"key": "33837212", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8080671984161347, "ground_truth": 0}, {"key": "33837212", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339646945859, "ground_truth": 0}, {"key": "33837212", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.633410272188085, "ground_truth": 0}, {"key": "40945179", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7676898589568887, "ground_truth": 0}, {"key": "40945179", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5736784210956539, "ground_truth": 0}, {"key": "40945179", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8019358381501904, "ground_truth": 0}, {"key": "40945179", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191427717528, "ground_truth": 0}, {"key": "40945179", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494400097469, "ground_truth": 0}, {"key": "34152358", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5964331595719204, "ground_truth": 0}, {"key": "34152358", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6959583262739345, "ground_truth": 0}, {"key": "34152358", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4746312093994504, "ground_truth": 0}, {"key": "34152358", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307733154686, "ground_truth": 0}, {"key": "34152358", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359015482166488, "ground_truth": 0}, {"key": "34136541", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.825589725712792, "ground_truth": 0}, {"key": "34136541", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8031738124649767, "ground_truth": 0}, {"key": "34136541", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7853085897321205, "ground_truth": 0}, {"key": "34136541", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9273632958086632, "ground_truth": 0}, {"key": "34136541", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068973810455, "ground_truth": 0}, {"key": "37469603", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6039318400201056, "ground_truth": 0}, {"key": "37469603", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6388352737441565, "ground_truth": 0}, {"key": "37469603", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6723317205453877, "ground_truth": 0}, {"key": "37469603", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583302843786, "ground_truth": 0}, {"key": "37469603", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935102151995, "ground_truth": 0}, {"key": "37353611", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9582261134243619, "ground_truth": 0}, {"key": "37353611", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9399133507225248, "ground_truth": 0}, {"key": "37353611", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8697145792241666, "ground_truth": 0}, {"key": "37353611", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9268352728299993, "ground_truth": 0}, {"key": "37353611", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9130583345990766, "ground_truth": 0}, {"key": "37211649", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5888891299521495, "ground_truth": 0}, {"key": "37211649", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7154239935244907, "ground_truth": 0}, {"key": "37211649", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6132365870214921, "ground_truth": 0}, {"key": "37211649", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004231072666, "ground_truth": 0}, {"key": "37211649", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011625419258, "ground_truth": 0}, {"key": "37320976", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7505527847314121, "ground_truth": 0}, {"key": "37320976", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.596433148995344, "ground_truth": 0}, {"key": "37320976", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7745833917530707, "ground_truth": 0}, {"key": "37320976", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339711542207, "ground_truth": 0}, {"key": "37320976", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389682373357, "ground_truth": 0}, {"key": "34492412", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8479677649681892, "ground_truth": 0}, {"key": "34492412", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4980468798464049, "ground_truth": 0}, {"key": "34492412", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9496693659546573, "ground_truth": 0}, {"key": "34492412", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789037963336, "ground_truth": 0}, {"key": "34492412", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.778649308703466, "ground_truth": 0}, {"key": "36655016", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8976952867604986, "ground_truth": 0}, {"key": "36655016", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9504109769773971, "ground_truth": 0}, {"key": "36655016", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9489172657718908, "ground_truth": 0}, {"key": "36655016", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9407897500808882, "ground_truth": 0}, {"key": "36655016", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9294403980413487, "ground_truth": 0}, {"key": "35220773", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6619228728675662, "ground_truth": 0}, {"key": "35220773", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5078118535298749, "ground_truth": 0}, {"key": "35220773", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7918210680080846, "ground_truth": 0}, {"key": "35220773", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786982990767, "ground_truth": 0}, {"key": "35220773", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125726660787, "ground_truth": 0}, {"key": "31569808", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7041601389314617, "ground_truth": 0}, {"key": "31569808", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.517570889793473, "ground_truth": 0}, {"key": "31569808", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3904758160933701, "ground_truth": 0}, {"key": "31569808", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213013631904, "ground_truth": 0}, {"key": "31569808", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982201828234, "ground_truth": 0}, {"key": "37696256", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6406358514212898, "ground_truth": 0}, {"key": "37696256", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6095241797207139, "ground_truth": 0}, {"key": "37696256", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6671476731372047, "ground_truth": 0}, {"key": "37696256", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413643239054, "ground_truth": 0}, {"key": "37696256", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.521471176392468, "ground_truth": 0}, {"key": "36874328", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.737158169847287, "ground_truth": 0}, {"key": "36874328", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7634837959167453, "ground_truth": 0}, {"key": "36874328", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8092759822555387, "ground_truth": 0}, {"key": "36874328", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104468387941, "ground_truth": 0}, {"key": "36874328", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105602263854, "ground_truth": 0}, {"key": "24532377", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2523840470863562, "ground_truth": 0}, {"key": "24532377", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2509127818597159, "ground_truth": 0}, {"key": "24532377", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.28140560284301946, "ground_truth": 0}, {"key": "24532377", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.18952108856246933, "ground_truth": 0}, {"key": "24532377", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3191213816245911, "ground_truth": 0}, {"key": "39560618", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.603931823362177, "ground_truth": 0}, {"key": "39560618", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.760650664236615, "ground_truth": 0}, {"key": "39560618", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6740504951439099, "ground_truth": 0}, {"key": "39560618", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.552539733958441, "ground_truth": 0}, {"key": "39560618", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445649876869, "ground_truth": 0}, {"key": "34922693", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.141281420047085, "ground_truth": 0}, {"key": "34922693", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.14511536038602776, "ground_truth": 0}, {"key": "34922693", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.12252321093920598, "ground_truth": 0}, {"key": "34922693", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.08449275880835301, "ground_truth": 0}, {"key": "34922693", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.19436781918988336, "ground_truth": 0}, {"key": "33629577", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.35936417003241067, "ground_truth": 0}, {"key": "33629577", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5292634232798183, "ground_truth": 0}, {"key": "33629577", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6791786903388717, "ground_truth": 0}, {"key": "33629577", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318232008125, "ground_truth": 0}, {"key": "33629577", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947323777908, "ground_truth": 0}, {"key": "32284359", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5292633680329049, "ground_truth": 0}, {"key": "32284359", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4513264993837705, "ground_truth": 0}, {"key": "32284359", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5755879977120136, "ground_truth": 0}, {"key": "32284359", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757645816763533, "ground_truth": 0}, {"key": "32284359", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292634069975318, "ground_truth": 0}, {"key": "28082962", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5698526762476666, "ground_truth": 0}, {"key": "28082962", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37754065506051504, "ground_truth": 0}, {"key": "28082962", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6020615710167463, "ground_truth": 0}, {"key": "28082962", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813031140638503, "ground_truth": 0}, {"key": "28082962", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117165971293343, "ground_truth": 0}, {"key": "24796803", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8469578220941798, "ground_truth": 0}, {"key": "24796803", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7879312129462362, "ground_truth": 0}, {"key": "24796803", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.734119523912699, "ground_truth": 0}, {"key": "24796803", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9412234429902876, "ground_truth": 0}, {"key": "24796803", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759666463689, "ground_truth": 0}, {"key": "35466150", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5813030955618698, "ground_truth": 0}, {"key": "35466150", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6757645883303657, "ground_truth": 0}, {"key": "35466150", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8615382005249942, "ground_truth": 0}, {"key": "35466150", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059232015897, "ground_truth": 0}, {"key": "35466150", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918332414846, "ground_truth": 0}, {"key": "35754289", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8976952949373614, "ground_truth": 0}, {"key": "35754289", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8233283952872426, "ground_truth": 0}, {"key": "35754289", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9073122240933152, "ground_truth": 0}, {"key": "35754289", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872046023643811, "ground_truth": 0}, {"key": "35754289", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297934206258, "ground_truth": 0}, {"key": "36678662", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9230391584971528, "ground_truth": 0}, {"key": "36678662", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9445872066335779, "ground_truth": 0}, {"key": "36678662", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.885631474145035, "ground_truth": 0}, {"key": "36678662", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423130309507, "ground_truth": 0}, {"key": "36678662", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314654896299, "ground_truth": 0}, {"key": "35399671", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9241418217661513, "ground_truth": 0}, {"key": "35399671", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8816149012581594, "ground_truth": 0}, {"key": "35399671", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9213576287581439, "ground_truth": 0}, {"key": "35399671", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767955176365, "ground_truth": 0}, {"key": "35399671", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8895288422581403, "ground_truth": 0}, {"key": "36888180", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6334102817216581, "ground_truth": 0}, {"key": "36888180", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7201714961257221, "ground_truth": 0}, {"key": "36888180", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8080672256407628, "ground_truth": 0}, {"key": "36888180", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646251498374, "ground_truth": 0}, {"key": "36888180", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300534510371, "ground_truth": 0}, {"key": "28061069", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7154239961862705, "ground_truth": 0}, {"key": "28061069", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4921881468652679, "ground_truth": 0}, {"key": "28061069", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5039061474606057, "ground_truth": 0}, {"key": "28061069", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640225872023, "ground_truth": 0}, {"key": "28061069", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.46101678530960954, "ground_truth": 0}, {"key": "22259982", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.46490157078160055, "ground_truth": 0}, {"key": "22259982", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4571367299066613, "ground_truth": 0}, {"key": "22259982", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.44360043962415263, "ground_truth": 0}, {"key": "22259982", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964245516016, "ground_truth": 0}, {"key": "22259982", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3812195577433011, "ground_truth": 0}, {"key": "34026805", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8679338478633961, "ground_truth": 0}, {"key": "34026805", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9111797040549567, "ground_truth": 0}, {"key": "34026805", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8489722093047878, "ground_truth": 0}, {"key": "34026805", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063715897144, "ground_truth": 0}, {"key": "34026805", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581534974971, "ground_truth": 0}, {"key": "36713809", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8244619314155491, "ground_truth": 0}, {"key": "36713809", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7745834035495172, "ground_truth": 0}, {"key": "36713809", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7106283045696477, "ground_truth": 0}, {"key": "36713809", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640461018942, "ground_truth": 0}, {"key": "36713809", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324847845662, "ground_truth": 0}, {"key": "39726411", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2782567764337997, "ground_truth": 0}, {"key": "39726411", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2829881305405995, "ground_truth": 0}, {"key": "39726411", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5602526739478106, "ground_truth": 0}, {"key": "39726411", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643509932295, "ground_truth": 0}, {"key": "39726411", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.43590150978524816, "ground_truth": 0}, {"key": "37069841", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7534666575265592, "ground_truth": 0}, {"key": "37069841", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7295197609760741, "ground_truth": 0}, {"key": "37069841", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7233094553160226, "ground_truth": 0}, {"key": "37069841", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786110496929, "ground_truth": 0}, {"key": "37069841", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438951080855699, "ground_truth": 0}, {"key": "38894693", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6688802312103836, "ground_truth": 0}, {"key": "38894693", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6706082591120024, "ground_truth": 0}, {"key": "38894693", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7201715214834318, "ground_truth": 0}, {"key": "38894693", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723834227494, "ground_truth": 0}, {"key": "38894693", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352826369087, "ground_truth": 0}, {"key": "33946032", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.980129285469617, "ground_truth": 0}, {"key": "33946032", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9869795096446182, "ground_truth": 0}, {"key": "33946032", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9825575149621174, "ground_truth": 0}, {"key": "33946032", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.907967145542709, "ground_truth": 0}, {"key": "33946032", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9632305334658919, "ground_truth": 0}, {"key": "39035311", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7416740338143374, "ground_truth": 0}, {"key": "39035311", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7704647916675625, "ground_truth": 0}, {"key": "39035311", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8714748640831228, "ground_truth": 0}, {"key": "39035311", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619343364633, "ground_truth": 0}, {"key": "39035311", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799929047248679, "ground_truth": 0}, {"key": "27680038", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.29746991223093794, "ground_truth": 0}, {"key": "27680038", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.32082130910998885, "ground_truth": 0}, {"key": "27680038", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.20946968527091353, "ground_truth": 0}, {"key": "27680038", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.32082131520362855, "ground_truth": 0}, {"key": "27680038", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.13206614718933193, "ground_truth": 0}, {"key": "36901907", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8056321903957528, "ground_truth": 0}, {"key": "36901907", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7386690728870923, "ground_truth": 0}, {"key": "36901907", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7826624771103726, "ground_truth": 0}, {"key": "36901907", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085979355523, "ground_truth": 0}, {"key": "36901907", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.754915012766779, "ground_truth": 0}, {"key": "21530542", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5428633008778724, "ground_truth": 0}, {"key": "21530542", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4726834695630771, "ground_truth": 0}, {"key": "21530542", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3363310466346583, "ground_truth": 0}, {"key": "21530542", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033478754132, "ground_truth": 0}, {"key": "21530542", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082948607355, "ground_truth": 0}, {"key": "38192532", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7786493119504663, "ground_truth": 0}, {"key": "38192532", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.835483546569817, "ground_truth": 0}, {"key": "38192532", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9086178901005112, "ground_truth": 0}, {"key": "38192532", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063664910454, "ground_truth": 0}, {"key": "38192532", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253657327052, "ground_truth": 0}, {"key": "34102400", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.1285251258202534, "ground_truth": 0}, {"key": "34102400", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.15405756659996905, "ground_truth": 0}, {"key": "34102400", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1907240181633304, "ground_truth": 0}, {"key": "34102400", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.16451645701911255, "ground_truth": 0}, {"key": "34102400", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.21866939283608594, "ground_truth": 0}, {"key": "36133399", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7969253630674925, "ground_truth": 0}, {"key": "36133399", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.874934622568572, "ground_truth": 0}, {"key": "36133399", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6057990347729338, "ground_truth": 0}, {"key": "36133399", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583113059606, "ground_truth": 0}, {"key": "36133399", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195154960422, "ground_truth": 0}, {"key": "34314544", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7248702852572249, "ground_truth": 0}, {"key": "34314544", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7520125724272287, "ground_truth": 0}, {"key": "34314544", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7264256210480982, "ground_truth": 0}, {"key": "34314544", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300593516851, "ground_truth": 0}, {"key": "34314544", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056197423963, "ground_truth": 0}, {"key": "33460074", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7981867811734532, "ground_truth": 0}, {"key": "33460074", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7341195565802265, "ground_truth": 0}, {"key": "33460074", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7704647936982103, "ground_truth": 0}, {"key": "33460074", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754444790095, "ground_truth": 0}, {"key": "33460074", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187368012967327, "ground_truth": 0}, {"key": "36191495", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3174262815972471, "ground_truth": 0}, {"key": "36191495", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3665897501787258, "ground_truth": 0}, {"key": "36191495", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3191213878459521, "ground_truth": 0}, {"key": "36191495", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468964883911, "ground_truth": 0}, {"key": "36191495", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004009717154, "ground_truth": 0}, {"key": "39532668", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9012274041195344, "ground_truth": 0}, {"key": "39532668", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8499711670907047, "ground_truth": 0}, {"key": "39532668", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7634837788263417, "ground_truth": 0}, {"key": "39532668", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210761519135, "ground_truth": 0}, {"key": "39532668", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884451475695, "ground_truth": 0}, {"key": "20328247", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3276682841064341, "ground_truth": 0}, {"key": "20328247", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2538610128159514, "ground_truth": 0}, {"key": "20328247", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2829881034403589, "ground_truth": 0}, {"key": "20328247", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.46295859321569754, "ground_truth": 0}, {"key": "20328247", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359015278375168, "ground_truth": 0}, {"key": "39112675", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.653126927808208, "ground_truth": 0}, {"key": "39112675", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.588889146491379, "ground_truth": 0}, {"key": "39112675", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6723316763844263, "ground_truth": 0}, {"key": "39112675", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723317095865459, "ground_truth": 0}, {"key": "39112675", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907791878549492, "ground_truth": 0}, {"key": "31620300", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6206216155075873, "ground_truth": 0}, {"key": "31620300", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5136684472183547, "ground_truth": 0}, {"key": "31620300", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5486734715346394, "ground_truth": 0}, {"key": "31620300", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926665721304901, "ground_truth": 0}, {"key": "31620300", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964381455296, "ground_truth": 0}, {"key": "37518509", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5851011274390248, "ground_truth": 0}, {"key": "37518509", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4359014966701139, "ground_truth": 0}, {"key": "37518509", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3702253660891564, "ground_truth": 0}, {"key": "37518509", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864513882639464, "ground_truth": 0}, {"key": "37518509", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711486383216, "ground_truth": 0}, {"key": "35454095", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7185943955789788, "ground_truth": 0}, {"key": "35454095", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8714748627943071, "ground_truth": 0}, {"key": "35454095", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8679338451241215, "ground_truth": 0}, {"key": "35454095", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117166072148897, "ground_truth": 0}, {"key": "35454095", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217431911730785, "ground_truth": 0}, {"key": "38542788", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9241418196410683, "ground_truth": 0}, {"key": "38542788", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9278877956714027, "ground_truth": 0}, {"key": "38542788", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.953275038879099, "ground_truth": 0}, {"key": "38542788", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9559813511292596, "ground_truth": 0}, {"key": "38542788", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.949669370065671, "ground_truth": 0}, {"key": "23944937", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6334102714868003, "ground_truth": 0}, {"key": "23944937", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5813031062131413, "ground_truth": 0}, {"key": "23944937", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6388352525169748, "ground_truth": 0}, {"key": "23944937", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585814326198, "ground_truth": 0}, {"key": "23944937", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105704251888, "ground_truth": 0}, {"key": "31753944", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.48047867497240215, "ground_truth": 0}, {"key": "31753944", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.47463116656705906, "ground_truth": 0}, {"key": "31753944", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4359015293219811, "ground_truth": 0}, {"key": "31753944", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552952662740997, "ground_truth": 0}, {"key": "31753944", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4301473474374607, "ground_truth": 0}, {"key": "35527214", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5019530860766144, "ground_truth": 0}, {"key": "35527214", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.640635834050049, "ground_truth": 0}, {"key": "35527214", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6723317095180245, "ground_truth": 0}, {"key": "35527214", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802394443353, "ground_truth": 0}, {"key": "35527214", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736783990490711, "ground_truth": 0}, {"key": "40400404", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9618217261937877, "ground_truth": 0}, {"key": "40400404", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9449947049495441, "ground_truth": 0}, {"key": "40400404", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9575961724671078, "ground_truth": 0}, {"key": "40400404", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037275106325, "ground_truth": 0}, {"key": "40400404", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9284088002080778, "ground_truth": 0}, {"key": "21713119", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.24798742882361235, "ground_truth": 0}, {"key": "21713119", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2005576846143464, "ground_truth": 0}, {"key": "21713119", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5273165143867194, "ground_truth": 0}, {"key": "21713119", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3867634491785815, "ground_truth": 0}, {"key": "21713119", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3720487867314948, "ground_truth": 0}, {"key": "28730678", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9111797150769388, "ground_truth": 0}, {"key": "28730678", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8175744744552084, "ground_truth": 0}, {"key": "28730678", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.766293639037986, "ground_truth": 0}, {"key": "28730678", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142444052414, "ground_truth": 0}, {"key": "28730678", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.801935834597955, "ground_truth": 0}, {"key": "36823733", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7690802219386397, "ground_truth": 0}, {"key": "36823733", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5253688167103591, "ground_truth": 0}, {"key": "36823733", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.747615954260542, "ground_truth": 0}, {"key": "36823733", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191370876683, "ground_truth": 0}, {"key": "36823733", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512785905601, "ground_truth": 0}, {"key": "35988862", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4474602848842676, "ground_truth": 0}, {"key": "35988862", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.46684558903848045, "ground_truth": 0}, {"key": "35988862", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4863315340594092, "ground_truth": 0}, {"key": "35988862", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.31069439827976536, "ground_truth": 0}, {"key": "35988862", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367066959506, "ground_truth": 0}, {"key": "40499665", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9407897492497, "ground_truth": 0}, {"key": "40499665", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9118099637870367, "ground_truth": 0}, {"key": "40499665", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8918110472710444, "ground_truth": 0}, {"key": "40499665", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9453993951080238, "ground_truth": 0}, {"key": "40499665", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053222918903829, "ground_truth": 0}, {"key": "32829820", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8509646988835343, "ground_truth": 0}, {"key": "32829820", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4571367060702354, "ground_truth": 0}, {"key": "32829820", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6460136856612301, "ground_truth": 0}, {"key": "32829820", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672066937964, "ground_truth": 0}, {"key": "32829820", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666563243586, "ground_truth": 0}, {"key": "20583553", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.20181321433667562, "ground_truth": 0}, {"key": "20583553", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.08449275587715925, "ground_truth": 0}, {"key": "20583553", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.11279539647418667, "ground_truth": 0}, {"key": "20583553", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689404600730518, "ground_truth": 0}, {"key": "20583553", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.20689405225001772, "ground_truth": 0}, {"key": "30501550", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8624675217075991, "ground_truth": 0}, {"key": "30501550", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.783988466647155, "ground_truth": 0}, {"key": "30501550", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8633916158994027, "ground_truth": 0}, {"key": "30501550", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036238194439, "ground_truth": 0}, {"key": "30501550", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840563581793, "ground_truth": 0}, {"key": "38755897", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7505527537060867, "ground_truth": 0}, {"key": "38755897", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6893056338998583, "ground_truth": 0}, {"key": "38755897", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7839884755398077, "ground_truth": 0}, {"key": "38755897", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321720399445, "ground_truth": 0}, {"key": "38755897", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437748341486, "ground_truth": 0}, {"key": "35507201", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5467381339419046, "ground_truth": 0}, {"key": "35507201", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8407825834713835, "ground_truth": 0}, {"key": "35507201", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6740504642139487, "ground_truth": 0}, {"key": "35507201", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118890405151, "ground_truth": 0}, {"key": "35507201", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881483940576, "ground_truth": 0}, {"key": "36453511", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8895288493823214, "ground_truth": 0}, {"key": "36453511", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8519528014328225, "ground_truth": 0}, {"key": "36453511", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8333246184781761, "ground_truth": 0}, {"key": "36453511", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037369348947, "ground_truth": 0}, {"key": "36453511", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099480491334, "ground_truth": 0}, {"key": "38066835", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7634837671021577, "ground_truth": 0}, {"key": "38066835", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7201715153231905, "ground_truth": 0}, {"key": "38066835", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7918210763497983, "ground_truth": 0}, {"key": "38066835", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059611386091, "ground_truth": 0}, {"key": "38066835", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068941866056, "ground_truth": 0}, {"key": "39697181", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6242935111303229, "ground_truth": 0}, {"key": "39697181", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238910489137, "ground_truth": 0}, {"key": "39697181", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6242935466797062, "ground_truth": 0}, {"key": "39697181", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935149681539, "ground_truth": 0}, {"key": "39697181", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102563744198, "ground_truth": 0}, {"key": "21820893", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7170118884638731, "ground_truth": 0}, {"key": "21820893", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7759445501723674, "ground_truth": 0}, {"key": "21820893", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7201714997537588, "ground_truth": 0}, {"key": "21820893", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585843116975, "ground_truth": 0}, {"key": "21820893", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647011829026, "ground_truth": 0}, {"key": "40519933", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7759445482014241, "ground_truth": 0}, {"key": "40519933", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5698526673250931, "ground_truth": 0}, {"key": "40519933", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6279512298291235, "ground_truth": 0}, {"key": "40519933", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666149418146, "ground_truth": 0}, {"key": "40519933", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666616283763, "ground_truth": 0}, {"key": "30446033", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7122321997186151, "ground_truth": 0}, {"key": "30446033", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7853085706008521, "ground_truth": 0}, {"key": "30446033", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8233283862148956, "ground_truth": 0}, {"key": "30446033", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869837715783, "ground_truth": 0}, {"key": "30446033", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8688267793490603, "ground_truth": 0}, {"key": "40216291", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6926419821603167, "ground_truth": 0}, {"key": "40216291", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8879840426335822, "ground_truth": 0}, {"key": "40216291", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8895288474825377, "ground_truth": 0}, {"key": "40216291", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314747252197, "ground_truth": 0}, {"key": "40216291", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8895288406249477, "ground_truth": 0}, {"key": "33479118", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.34158249176745237, "ground_truth": 0}, {"key": "33479118", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4746311900853279, "ground_truth": 0}, {"key": "33479118", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "33479118", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.48242910621687046, "ground_truth": 0}, {"key": "33479118", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33285232689006206, "ground_truth": 0}, {"key": "22297373", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4455295288724861, "ground_truth": 0}, {"key": "22297373", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.18242553317302068, "ground_truth": 0}, {"key": "22297373", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.21733752304069617, "ground_truth": 0}, {"key": "22297373", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.31237001767778955, "ground_truth": 0}, {"key": "22297373", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1431877106550519, "ground_truth": 0}, {"key": "36463668", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.1732881981862113, "ground_truth": 0}, {"key": "36463668", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5019531184974616, "ground_truth": 0}, {"key": "36463668", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.30239107507120616, "ground_truth": 0}, {"key": "36463668", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.1847675021572076, "ground_truth": 0}, {"key": "36463668", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.17667160153716646, "ground_truth": 0}, {"key": "35264615", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7505527552399933, "ground_truth": 0}, {"key": "35264615", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7759445311117996, "ground_truth": 0}, {"key": "35264615", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3242353694301646, "ground_truth": 0}, {"key": "35264615", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.757794370472148, "ground_truth": 0}, {"key": "35264615", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121871082855, "ground_truth": 0}, {"key": "39898482", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9458012763203124, "ground_truth": 0}, {"key": "39898482", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9252299484493964, "ground_truth": 0}, {"key": "39898482", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9124361533200489, "ground_truth": 0}, {"key": "39898482", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111796966783844, "ground_truth": 0}, {"key": "39898482", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9059898246299585, "ground_truth": 0}, {"key": "37228721", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6825737300418614, "ground_truth": 0}, {"key": "37228721", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7264256022729659, "ground_truth": 0}, {"key": "37228721", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7718434842922903, "ground_truth": 0}, {"key": "37228721", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.71701189028818, "ground_truth": 0}, {"key": "37228721", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476820703595, "ground_truth": 0}, {"key": "24535799", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9783846694852908, "ground_truth": 0}, {"key": "24535799", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9556514174686667, "ground_truth": 0}, {"key": "24535799", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9136765172067642, "ground_truth": 0}, {"key": "24535799", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9155072535647653, "ground_truth": 0}, {"key": "24535799", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314738958025, "ground_truth": 0}, {"key": "35177759", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8469578363377791, "ground_truth": 0}, {"key": "35177759", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6976088919855375, "ground_truth": 0}, {"key": "35177759", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8031737879614989, "ground_truth": 0}, {"key": "35177759", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872299268333, "ground_truth": 0}, {"key": "35177759", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675233185665, "ground_truth": 0}, {"key": "34364829", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7074046760405714, "ground_truth": 0}, {"key": "34364829", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7648916002804936, "ground_truth": 0}, {"key": "34364829", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.71542400800723, "ground_truth": 0}, {"key": "34364829", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.562176523292056, "ground_truth": 0}, {"key": "34364829", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526797839457, "ground_truth": 0}, {"key": "38090732", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8509647048512728, "ground_truth": 0}, {"key": "38090732", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8872046058793479, "ground_truth": 0}, {"key": "38090732", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6513548612802474, "ground_truth": 0}, {"key": "38090732", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366560566962, "ground_truth": 0}, {"key": "38090732", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528083632091, "ground_truth": 0}, {"key": "30651479", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7264256058923125, "ground_truth": 0}, {"key": "30651479", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8068526259237659, "ground_truth": 0}, {"key": "30651479", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8175744724384995, "ground_truth": 0}, {"key": "30651479", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367885686365, "ground_truth": 0}, {"key": "30651479", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.753466646597751, "ground_truth": 0}, {"key": "39380921", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.474631195625373, "ground_truth": 0}, {"key": "39380921", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.16885695998293368, "ground_truth": 0}, {"key": "39380921", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.31237000238944795, "ground_truth": 0}, {"key": "39380921", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734957635173, "ground_truth": 0}, {"key": "39380921", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2958398389030267, "ground_truth": 0}, {"key": "39037490", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.19806417626105044, "ground_truth": 0}, {"key": "39037490", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2120688071765456, "ground_truth": 0}, {"key": "39037490", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.14128141934901015, "ground_truth": 0}, {"key": "39037490", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.15507846924204413, "ground_truth": 0}, {"key": "39037490", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.10669059278947005, "ground_truth": 0}, {"key": "35917499", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8509647069312031, "ground_truth": 0}, {"key": "35917499", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8832359845845584, "ground_truth": 0}, {"key": "35917499", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.857768106986225, "ground_truth": 0}, {"key": "35917499", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306357854956, "ground_truth": 0}, {"key": "35917499", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122206348802, "ground_truth": 0}, {"key": "34908073", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8267117787977226, "ground_truth": 0}, {"key": "34908073", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6352224299777715, "ground_truth": 0}, {"key": "34908073", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.564098487175263, "ground_truth": 0}, {"key": "34908073", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094609576562, "ground_truth": 0}, {"key": "34908073", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.569852671829482, "ground_truth": 0}, {"key": "36344759", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8606036144843415, "ground_truth": 0}, {"key": "36344759", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5136684852326406, "ground_truth": 0}, {"key": "36344759", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7122321781096517, "ground_truth": 0}, {"key": "36344759", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441045319293, "ground_truth": 0}, {"key": "36344759", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256516697158, "ground_truth": 0}, {"key": "39984637", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5945512372810138, "ground_truth": 0}, {"key": "39984637", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7057850301168264, "ground_truth": 0}, {"key": "39984637", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.40922080343170675, "ground_truth": 0}, {"key": "39984637", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.43590151006760397, "ground_truth": 0}, {"key": "39984637", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.44167300029128403, "ground_truth": 0}, {"key": "17917326", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5195213258145162, "ground_truth": 0}, {"key": "17917326", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48438008753443673, "ground_truth": 0}, {"key": "17917326", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6150878475006976, "ground_truth": 0}, {"key": "17917326", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548596075958, "ground_truth": 0}, {"key": "17917326", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.509764355147238, "ground_truth": 0}, {"key": "32193638", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6001883778715676, "ground_truth": 0}, {"key": "32193638", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6688802741281107, "ground_truth": 0}, {"key": "32193638", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.571766602009524, "ground_truth": 0}, {"key": "32193638", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494565363552, "ground_truth": 0}, {"key": "32193638", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241763278922, "ground_truth": 0}, {"key": "34564692", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.692641991204251, "ground_truth": 0}, {"key": "34564692", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7772998771578018, "ground_truth": 0}, {"key": "34564692", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7025300642293083, "ground_truth": 0}, {"key": "34564692", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545393046643, "ground_truth": 0}, {"key": "34564692", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527561723572, "ground_truth": 0}, {"key": "39329284", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.989671846381038, "ground_truth": 0}, {"key": "39329284", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.790530316915743, "ground_truth": 0}, {"key": "39329284", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9838471653645811, "ground_truth": 0}, {"key": "39329284", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9890130563821369, "ground_truth": 0}, {"key": "39329284", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.992304352536281, "ground_truth": 0}, {"key": "37438541", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7386690705006287, "ground_truth": 0}, {"key": "37438541", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5370413957106245, "ground_truth": 0}, {"key": "37438541", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4301473505030034, "ground_truth": 0}, {"key": "37438541", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3720487928498297, "ground_truth": 0}, {"key": "37438541", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2689414002353486, "ground_truth": 0}, {"key": "34652757", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7956581147735754, "ground_truth": 0}, {"key": "34652757", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8783142348735525, "ground_truth": 0}, {"key": "34652757", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7892336854451067, "ground_truth": 0}, {"key": "34652757", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872045870175435, "ground_truth": 0}, {"key": "34652757", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.838679746618023, "ground_truth": 0}, {"key": "31361004", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3886180338128486, "ground_truth": 0}, {"key": "31361004", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6315942996879189, "ground_truth": 0}, {"key": "31361004", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8872045999187597, "ground_truth": 0}, {"key": "31361004", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.911809956436562, "ground_truth": 0}, {"key": "31361004", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256092062558, "ground_truth": 0}, {"key": "26150727", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.403566881235467, "ground_truth": 0}, {"key": "26150727", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238605984285, "ground_truth": 0}, {"key": "26150727", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5660185383465763, "ground_truth": 0}, {"key": "26150727", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366025360962, "ground_truth": 0}, {"key": "26150727", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432032227183, "ground_truth": 0}, {"key": "36997402", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7248702749207759, "ground_truth": 0}, {"key": "36997402", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8577681070473319, "ground_truth": 0}, {"key": "36997402", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5755879933959593, "ground_truth": 0}, {"key": "36997402", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191436710316, "ground_truth": 0}, {"key": "36997402", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583126062701, "ground_truth": 0}, {"key": "37430643", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.33285232187739555, "ground_truth": 0}, {"key": "37430643", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5078118924173283, "ground_truth": 0}, {"key": "37430643", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4378235145885507, "ground_truth": 0}, {"key": "37430643", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4397473289685035, "ground_truth": 0}, {"key": "37430643", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.41489881971375875, "ground_truth": 0}, {"key": "36964631", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6279512148999066, "ground_truth": 0}, {"key": "36964631", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7905303138320325, "ground_truth": 0}, {"key": "36964631", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6513548871757862, "ground_truth": 0}, {"key": "36964631", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527585284538, "ground_truth": 0}, {"key": "36964631", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175709140899094, "ground_truth": 0}, {"key": "35502013", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6791786888926866, "ground_truth": 0}, {"key": "35502013", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7008948206071242, "ground_truth": 0}, {"key": "35502013", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.653126917631209, "ground_truth": 0}, {"key": "35502013", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102778021629, "ground_truth": 0}, {"key": "35502013", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013753008265, "ground_truth": 0}, {"key": "33987664", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6406358793180544, "ground_truth": 0}, {"key": "33987664", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8652240686662626, "ground_truth": 0}, {"key": "33987664", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7279754608789367, "ground_truth": 0}, {"key": "33987664", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891174329305, "ground_truth": 0}, {"key": "33987664", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382060707325, "ground_truth": 0}, {"key": "35203721", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6001883555752169, "ground_truth": 0}, {"key": "35203721", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6242935616477716, "ground_truth": 0}, {"key": "35203721", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7295197767379027, "ground_truth": 0}, {"key": "35203721", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195134921414, "ground_truth": 0}, {"key": "35203721", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073480662464, "ground_truth": 0}, {"key": "39028348", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8056321837256429, "ground_truth": 0}, {"key": "39028348", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.569852662986738, "ground_truth": 0}, {"key": "39028348", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8529354740356374, "ground_truth": 0}, {"key": "39028348", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.860603611805889, "ground_truth": 0}, {"key": "39028348", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918256997684, "ground_truth": 0}, {"key": "37459383", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.868826790700861, "ground_truth": 0}, {"key": "37459383", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.887204606388558, "ground_truth": 0}, {"key": "37459383", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8872045848284277, "ground_truth": 0}, {"key": "37459383", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.834406882495747, "ground_truth": 0}, {"key": "37459383", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675313592911, "ground_truth": 0}, {"key": "34020070", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7490872139738358, "ground_truth": 0}, {"key": "34020070", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6206216067744503, "ground_truth": 0}, {"key": "34020070", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6113819830920291, "ground_truth": 0}, {"key": "34020070", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998497866737, "ground_truth": 0}, {"key": "34020070", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615791933358, "ground_truth": 0}, {"key": "35176615", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8267117981656551, "ground_truth": 0}, {"key": "35176615", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7759445367024841, "ground_truth": 0}, {"key": "35176615", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5253688300748051, "ground_truth": 0}, {"key": "35176615", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.640635852820294, "ground_truth": 0}, {"key": "35176615", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336886063773, "ground_truth": 0}, {"key": "33296389", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.80440591983378, "ground_truth": 0}, {"key": "33296389", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8679338473943455, "ground_truth": 0}, {"key": "33296389", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7341195436777779, "ground_truth": 0}, {"key": "33296389", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324912583357, "ground_truth": 0}, {"key": "33296389", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324817074634, "ground_truth": 0}, {"key": "35399504", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9412234387278839, "ground_truth": 0}, {"key": "35399504", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9257686350943248, "ground_truth": 0}, {"key": "35399504", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9339146271021663, "ground_truth": 0}, {"key": "35399504", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9458012643859527, "ground_truth": 0}, {"key": "35399504", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505339671522, "ground_truth": 0}, {"key": "34807886", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.21206881044060893, "ground_truth": 0}, {"key": "34807886", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.16132023851542862, "ground_truth": 0}, {"key": "34807886", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3208213079679744, "ground_truth": 0}, {"key": "34807886", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.25238405141647824, "ground_truth": 0}, {"key": "34807886", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.550607348803939, "ground_truth": 0}, {"key": "37629813", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6057990521487442, "ground_truth": 0}, {"key": "37629813", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6808786179868931, "ground_truth": 0}, {"key": "37629813", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8365545713910255, "ground_truth": 0}, {"key": "37629813", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.670608300480609, "ground_truth": 0}, {"key": "37629813", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.43398150028861937, "ground_truth": 0}, {"key": "28084389", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8449215264802553, "ground_truth": 0}, {"key": "28084389", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9059898138015293, "ground_truth": 0}, {"key": "28084389", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7690802495080754, "ground_truth": 0}, {"key": "28084389", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9416541547656261, "ground_truth": 0}, {"key": "28084389", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9124361581414255, "ground_truth": 0}, {"key": "35391734", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7648916132619248, "ground_truth": 0}, {"key": "35391734", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8615382062062897, "ground_truth": 0}, {"key": "35391734", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8577681147212013, "ground_truth": 0}, {"key": "35391734", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933789126116, "ground_truth": 0}, {"key": "35391734", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423486071527, "ground_truth": 0}, {"key": "40214591", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6601723942483725, "ground_truth": 0}, {"key": "40214591", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.620621632353058, "ground_truth": 0}, {"key": "40214591", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5370413877647856, "ground_truth": 0}, {"key": "40214591", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47463118317182273, "ground_truth": 0}, {"key": "40214591", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224293164719, "ground_truth": 0}, {"key": "26283171", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8019358356503001, "ground_truth": 0}, {"key": "26283171", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8300437529529933, "ground_truth": 0}, {"key": "26283171", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.721743212822517, "ground_truth": 0}, {"key": "26283171", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879311856999575, "ground_truth": 0}, {"key": "26283171", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311987308195, "ground_truth": 0}, {"key": "37084030", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3259494944460784, "ground_truth": 0}, {"key": "37084030", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2720245617739567, "ground_truth": 0}, {"key": "37084030", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.16559311686391093, "ground_truth": 0}, {"key": "37084030", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.13660839041050798, "ground_truth": 0}, {"key": "37084030", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074558900083165, "ground_truth": 0}, {"key": "39027295", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.28140560304640044, "ground_truth": 0}, {"key": "39027295", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.31237002988993195, "ground_truth": 0}, {"key": "39027295", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43014734108020863, "ground_truth": 0}, {"key": "39027295", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030856510991, "ground_truth": 0}, {"key": "39027295", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3720488149688106, "ground_truth": 0}, {"key": "14018647", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.27825678701144685, "ground_truth": 0}, {"key": "14018647", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.34864514742389074, "ground_truth": 0}, {"key": "14018647", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.30902370794744655, "ground_truth": 0}, {"key": "14018647", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.315735964538077, "ground_truth": 0}, {"key": "14018647", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.21206880993268218, "ground_truth": 0}, {"key": "37424289", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8848377845921936, "ground_truth": 0}, {"key": "37424289", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9726235092707258, "ground_truth": 0}, {"key": "37424289", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9394706193491568, "ground_truth": 0}, {"key": "37424289", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9706877700838236, "ground_truth": 0}, {"key": "37424289", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9390248228744619, "ground_truth": 0}, {"key": "37498031", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.494140913517334, "ground_truth": 0}, {"key": "37498031", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6442251053226019, "ground_truth": 0}, {"key": "37498031", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4551986211765683, "ground_truth": 0}, {"key": "37498031", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926665895096035, "ground_truth": 0}, {"key": "37498031", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167993303272, "ground_truth": 0}, {"key": "30104095", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7170118679229166, "ground_truth": 0}, {"key": "30104095", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5660185559457699, "ground_truth": 0}, {"key": "30104095", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6315942877397983, "ground_truth": 0}, {"key": "30104095", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746043370823, "ground_truth": 0}, {"key": "30104095", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203447478879, "ground_truth": 0}, {"key": "37911407", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9032942062883242, "ground_truth": 0}, {"key": "37911407", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9651191156514803, "ground_truth": 0}, {"key": "37911407", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9462003567978854, "ground_truth": 0}, {"key": "37911407", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9753900705830433, "ground_truth": 0}, {"key": "37911407", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9362850100006819, "ground_truth": 0}, {"key": "39177472", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7662936254004471, "ground_truth": 0}, {"key": "39177472", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7690802620431695, "ground_truth": 0}, {"key": "39177472", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8615382102563095, "ground_truth": 0}, {"key": "39177472", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.744656349848907, "ground_truth": 0}, {"key": "39177472", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346183843906, "ground_truth": 0}, {"key": "32325454", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9588471123750246, "ground_truth": 0}, {"key": "32325454", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8962513770565506, "ground_truth": 0}, {"key": "32325454", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8976953055651022, "ground_truth": 0}, {"key": "32325454", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9284087998172332, "ground_truth": 0}, {"key": "32325454", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8887587995746177, "ground_truth": 0}, {"key": "38395319", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8187368019035101, "ground_truth": 0}, {"key": "38395319", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6859494373756984, "ground_truth": 0}, {"key": "38395319", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7233094626825085, "ground_truth": 0}, {"key": "38395319", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909763061149915, "ground_truth": 0}, {"key": "38395319", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.718594406512301, "ground_truth": 0}, {"key": "38235895", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3923368335658116, "ground_truth": 0}, {"key": "38235895", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5136684821027239, "ground_truth": 0}, {"key": "38235895", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.48047868420084966, "ground_truth": 0}, {"key": "38235895", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37387581177292717, "ground_truth": 0}, {"key": "38235895", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.47463118846856817, "ground_truth": 0}, {"key": "26543267", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3539862934772454, "ground_truth": 0}, {"key": "26543267", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5370413612190784, "ground_truth": 0}, {"key": "26543267", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5195213352714977, "ground_truth": 0}, {"key": "26543267", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4301473515084132, "ground_truth": 0}, {"key": "26543267", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191575238728, "ground_truth": 0}, {"key": "39054728", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9930961615214082, "ground_truth": 0}, {"key": "39054728", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9791955079955407, "ground_truth": 0}, {"key": "39054728", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.986151389751539, "ground_truth": 0}, {"key": "39054728", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.989671847609317, "ground_truth": 0}, {"key": "39054728", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9849273720272808, "ground_truth": 0}, {"key": "39158443", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8848377731008915, "ground_truth": 0}, {"key": "39158443", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7853085873473086, "ground_truth": 0}, {"key": "39158443", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8187367831823665, "ground_truth": 0}, {"key": "39158443", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.900529781936437, "ground_truth": 0}, {"key": "39158443", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619256586002, "ground_truth": 0}, {"key": "36254201", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5851011925668365, "ground_truth": 0}, {"key": "36254201", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2643583606292034, "ground_truth": 0}, {"key": "36254201", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3684057070972468, "ground_truth": 0}, {"key": "36254201", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020616097747419, "ground_truth": 0}, {"key": "36254201", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.43398148436234346, "ground_truth": 0}, {"key": "23434347", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5640984874821892, "ground_truth": 0}, {"key": "23434347", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.31742626808033303, "ground_truth": 0}, {"key": "23434347", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6187804085053941, "ground_truth": 0}, {"key": "23434347", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4785288170034249, "ground_truth": 0}, {"key": "23434347", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241516390396, "ground_truth": 0}, {"key": "34397620", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3611647306080596, "ground_truth": 0}, {"key": "34397620", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4301473394819119, "ground_truth": 0}, {"key": "34397620", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3380771170551872, "ground_truth": 0}, {"key": "34397620", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.43206339495160406, "ground_truth": 0}, {"key": "34397620", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378235153058449, "ground_truth": 0}, {"key": "34340916", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5774953364662566, "ground_truth": 0}, {"key": "34340916", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.622459358525101, "ground_truth": 0}, {"key": "34340916", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.36296922486503347, "ground_truth": 0}, {"key": "34340916", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.594551259494434, "ground_truth": 0}, {"key": "34340916", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984227097897, "ground_truth": 0}, {"key": "30375089", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.735641647820231, "ground_truth": 0}, {"key": "30375089", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6636689307451414, "ground_truth": 0}, {"key": "30375089", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6926419859165889, "ground_truth": 0}, {"key": "30375089", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621765110469621, "ground_truth": 0}, {"key": "30375089", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578338664365, "ground_truth": 0}, {"key": "35807797", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8856314745276107, "ground_truth": 0}, {"key": "35807797", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4687906148749408, "ground_truth": 0}, {"key": "35807797", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.895522687576835, "ground_truth": 0}, {"key": "35807797", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314669386596, "ground_truth": 0}, {"key": "35807797", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9339146253366535, "ground_truth": 0}, {"key": "34188172", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7839884602500682, "ground_truth": 0}, {"key": "34188172", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6150878446649686, "ground_truth": 0}, {"key": "34188172", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7634837503019143, "ground_truth": 0}, {"key": "34188172", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185820077646, "ground_truth": 0}, {"key": "34188172", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358765277401, "ground_truth": 0}, {"key": "37075567", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9246876927470127, "ground_truth": 0}, {"key": "37075567", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.885631476094648, "ground_truth": 0}, {"key": "37075567", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.931959583466928, "ground_truth": 0}, {"key": "37075567", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.880797068473731, "ground_truth": 0}, {"key": "37075567", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149144557385, "ground_truth": 0}, {"key": "35559735", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6039318401543734, "ground_truth": 0}, {"key": "35559735", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5907792040981932, "ground_truth": 0}, {"key": "35559735", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.79692537878983, "ground_truth": 0}, {"key": "35559735", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786762641778, "ground_truth": 0}, {"key": "35559735", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441265094742, "ground_truth": 0}, {"key": "33005019", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5544704598454832, "ground_truth": 0}, {"key": "33005019", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2925953057968236, "ground_truth": 0}, {"key": "33005019", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8300437809930963, "ground_truth": 0}, {"key": "33005019", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850251730328, "ground_truth": 0}, {"key": "33005019", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632762105482, "ground_truth": 0}, {"key": "30808252", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5774953875364686, "ground_truth": 0}, {"key": "30808252", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6113819879795106, "ground_truth": 0}, {"key": "30808252", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5350984180578068, "ground_truth": 0}, {"key": "30808252", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935177968286, "ground_truth": 0}, {"key": "30808252", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.46295860938321737, "ground_truth": 0}, {"key": "15159017", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.47852885553479096, "ground_truth": 0}, {"key": "15159017", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6242935407330981, "ground_truth": 0}, {"key": "15159017", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.752012551257605, "ground_truth": 0}, {"key": "15159017", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476825169605, "ground_truth": 0}, {"key": "15159017", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197872712968, "ground_truth": 0}, {"key": "24493400", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4882833770589962, "ground_truth": 0}, {"key": "24493400", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238918038543, "ground_truth": 0}, {"key": "24493400", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6424324762044624, "ground_truth": 0}, {"key": "24493400", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.45132652026039805, "ground_truth": 0}, {"key": "24493400", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125768384209, "ground_truth": 0}, {"key": "37791071", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.815232501255364, "ground_truth": 0}, {"key": "37791071", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.809275977303357, "ground_truth": 0}, {"key": "37791071", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9207896768926954, "ground_truth": 0}, {"key": "37791071", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744765366875, "ground_truth": 0}, {"key": "37791071", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437594309992, "ground_truth": 0}, {"key": "33528627", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8933094072537434, "ground_truth": 0}, {"key": "33528627", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7356416321518991, "ground_truth": 0}, {"key": "33528627", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8407825830762831, "ground_truth": 0}, {"key": "33528627", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593175676836, "ground_truth": 0}, {"key": "33528627", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592253990266783, "ground_truth": 0}, {"key": "39925662", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7994423180925394, "ground_truth": 0}, {"key": "39925662", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8679338355749028, "ground_truth": 0}, {"key": "39925662", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9019206747428093, "ground_truth": 0}, {"key": "39925662", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690702653281, "ground_truth": 0}, {"key": "39925662", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127520591283, "ground_truth": 0}, {"key": "29213416", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.17667160625749057, "ground_truth": 0}, {"key": "29213416", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.396068171642397, "ground_truth": 0}, {"key": "29213416", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3380771299644588, "ground_truth": 0}, {"key": "29213416", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633907663902, "ground_truth": 0}, {"key": "29213416", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3433417192044868, "ground_truth": 0}, {"key": "34492745", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.31573600651568307, "ground_truth": 0}, {"key": "34492745", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.28457598549810137, "ground_truth": 0}, {"key": "34492745", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.28776780607298985, "ground_truth": 0}, {"key": "34492745", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918303517732, "ground_truth": 0}, {"key": "34492745", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5312093747151346, "ground_truth": 0}, {"key": "34191937", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6943026754720134, "ground_truth": 0}, {"key": "34191937", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2829880940292439, "ground_truth": 0}, {"key": "34191937", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4882833946575538, "ground_truth": 0}, {"key": "34191937", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632160886797044, "ground_truth": 0}, {"key": "34191937", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033416010528, "ground_truth": 0}, {"key": "34933372", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7704647990229986, "ground_truth": 0}, {"key": "34933372", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8365545626903903, "ground_truth": 0}, {"key": "34933372", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.76489159524387, "ground_truth": 0}, {"key": "34933372", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884759470869, "ground_truth": 0}, {"key": "34933372", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416055229542, "ground_truth": 0}, {"key": "38714379", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9507778845326094, "ground_truth": 0}, {"key": "38714379", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8740772401294221, "ground_truth": 0}, {"key": "38714379", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9609517057621004, "ground_truth": 0}, {"key": "38714379", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142526367372, "ground_truth": 0}, {"key": "38714379", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9273632870695587, "ground_truth": 0}, {"key": "39220660", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7826624970533061, "ground_truth": 0}, {"key": "39220660", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8705972610269841, "ground_truth": 0}, {"key": "39220660", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8548846319485116, "ground_truth": 0}, {"key": "39220660", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104356302582, "ground_truth": 0}, {"key": "39220660", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528088307817, "ground_truth": 0}, {"key": "41028780", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6242935314740007, "ground_truth": 0}, {"key": "41028780", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7170118769565185, "ground_truth": 0}, {"key": "41028780", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6619228905374014, "ground_truth": 0}, {"key": "41028780", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601330755128, "ground_truth": 0}, {"key": "41028780", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6315942692224207, "ground_truth": 0}, {"key": "39457108", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5175709063545761, "ground_truth": 0}, {"key": "39457108", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37754069307879695, "ground_truth": 0}, {"key": "39457108", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5486734870347449, "ground_truth": 0}, {"key": "39457108", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.675764585538758, "ground_truth": 0}, {"key": "39457108", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059630002494, "ground_truth": 0}, {"key": "38288018", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.12336561856522948, "ground_truth": 0}, {"key": "38288018", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22405547345648316, "ground_truth": 0}, {"key": "38288018", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.31912140135091505, "ground_truth": 0}, {"key": "38288018", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.13753246570905894, "ground_truth": 0}, {"key": "38288018", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1441488527674698, "ground_truth": 0}, {"key": "40106293", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.31405051966829134, "ground_truth": 0}, {"key": "40106293", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.44939262665328306, "ground_truth": 0}, {"key": "40106293", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.25832597207490166, "ground_truth": 0}, {"key": "40106293", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3775406640647787, "ground_truth": 0}, {"key": "40106293", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4054487062158091, "ground_truth": 0}, {"key": "39948797", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6893056417369966, "ground_truth": 0}, {"key": "39948797", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9086179042791427, "ground_truth": 0}, {"key": "39948797", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6206216445320284, "ground_truth": 0}, {"key": "39948797", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358412832225, "ground_truth": 0}, {"key": "39948797", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760402695131, "ground_truth": 0}, {"key": "31853399", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.84796776543065, "ground_truth": 0}, {"key": "31853399", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.77321636117879, "ground_truth": 0}, {"key": "31853399", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8031737907905978, "ground_truth": 0}, {"key": "31853399", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204107448396, "ground_truth": 0}, {"key": "31853399", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324930149949, "ground_truth": 0}, {"key": "35273252", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.31912138041990257, "ground_truth": 0}, {"key": "35273252", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4301473233812487, "ground_truth": 0}, {"key": "35273252", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2751297121193276, "ground_truth": 0}, {"key": "35273252", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.22270015223533826, "ground_truth": 0}, {"key": "35273252", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014093164049, "ground_truth": 0}, {"key": "37130459", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9678992976314544, "ground_truth": 0}, {"key": "37130459", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9945730566425656, "ground_truth": 0}, {"key": "37130459", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9782188296217544, "ground_truth": 0}, {"key": "37130459", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9830850868120805, "ground_truth": 0}, {"key": "37130459", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9835969675581556, "ground_truth": 0}, {"key": "21734003", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7461390047145621, "ground_truth": 0}, {"key": "21734003", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.812867327656068, "ground_truth": 0}, {"key": "21734003", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7122321832403582, "ground_truth": 0}, {"key": "21734003", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473807540435, "ground_truth": 0}, {"key": "21734003", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956580895627124, "ground_truth": 0}, {"key": "33990737", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5544704447031575, "ground_truth": 0}, {"key": "33990737", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4551985915995131, "ground_truth": 0}, {"key": "33990737", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6406358579272677, "ground_truth": 0}, {"key": "33990737", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880011614452, "ground_truth": 0}, {"key": "33990737", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121880041428, "ground_truth": 0}, {"key": "34559912", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8991213808419463, "ground_truth": 0}, {"key": "34559912", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9372107896343578, "ground_truth": 0}, {"key": "34559912", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8255897339837113, "ground_truth": 0}, {"key": "34559912", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346121582018, "ground_truth": 0}, {"key": "34559912", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149036063065, "ground_truth": 0}, {"key": "39820439", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.13939637858025716, "ground_truth": 0}, {"key": "39820439", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4148988354270338, "ground_truth": 0}, {"key": "39820439", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5058591094964756, "ground_truth": 0}, {"key": "39820439", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.26588046393006176, "ground_truth": 0}, {"key": "39820439", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.24798743563071102, "ground_truth": 0}, {"key": "34759328", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8757869979151461, "ground_truth": 0}, {"key": "34759328", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9362850099874933, "ground_truth": 0}, {"key": "34759328", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.924687699057727, "ground_truth": 0}, {"key": "34759328", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9092645219943971, "ground_truth": 0}, {"key": "34759328", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9546474213070264, "ground_truth": 0}, {"key": "36939137", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7549149811967011, "ground_truth": 0}, {"key": "36939137", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8840392835373034, "ground_truth": 0}, {"key": "36939137", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8092759654089685, "ground_truth": 0}, {"key": "36939137", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760216694544, "ground_truth": 0}, {"key": "36939137", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884535433512, "ground_truth": 0}, {"key": "35851522", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7943849690956676, "ground_truth": 0}, {"key": "35851522", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8116760281364964, "ground_truth": 0}, {"key": "35851522", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6057990340109516, "ground_truth": 0}, {"key": "35851522", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494834908347, "ground_truth": 0}, {"key": "35851522", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947457186821, "ground_truth": 0}, {"key": "22412782", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5755880097424544, "ground_truth": 0}, {"key": "22412782", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7431679912589014, "ground_truth": 0}, {"key": "22412782", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5964331382125497, "ground_truth": 0}, {"key": "22412782", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291268515721, "ground_truth": 0}, {"key": "22412782", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799928885878825, "ground_truth": 0}, {"key": "38579227", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8438951060323567, "ground_truth": 0}, {"key": "38579227", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8577681046011143, "ground_truth": 0}, {"key": "38579227", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8365545611557516, "ground_truth": 0}, {"key": "38579227", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148126654271, "ground_truth": 0}, {"key": "38579227", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359947954901, "ground_truth": 0}, {"key": "37206995", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8104789217619419, "ground_truth": 0}, {"key": "37206995", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.850964702305103, "ground_truth": 0}, {"key": "37206995", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7138307694635325, "ground_truth": 0}, {"key": "37206995", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104586221738, "ground_truth": 0}, {"key": "37206995", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122937125399, "ground_truth": 0}, {"key": "38700847", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7138307646651904, "ground_truth": 0}, {"key": "38700847", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.762070120036652, "ground_truth": 0}, {"key": "38700847", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8670357584304957, "ground_truth": 0}, {"key": "38700847", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581457727547, "ground_truth": 0}, {"key": "38700847", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283092666246, "ground_truth": 0}, {"key": "20246590", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9935117306559972, "ground_truth": 0}, {"key": "20246590", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9923637834596484, "ground_truth": 0}, {"key": "20246590", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.991355821808559, "ground_truth": 0}, {"key": "20246590", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9911526448260481, "ground_truth": 0}, {"key": "20246590", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9902915235949018, "ground_truth": 0}, {"key": "39141360", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7981867925140333, "ground_truth": 0}, {"key": "39141360", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7690802312337953, "ground_truth": 0}, {"key": "39141360", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8539127650517452, "ground_truth": 0}, {"key": "39141360", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920158710706, "ground_truth": 0}, {"key": "39141360", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185944007992109, "ground_truth": 0}, {"key": "37906226", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5078118451500306, "ground_truth": 0}, {"key": "37906226", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3557749172539664, "ground_truth": 0}, {"key": "37906226", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.28776781113732863, "ground_truth": 0}, {"key": "37906226", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365433208438, "ground_truth": 0}, {"key": "37906226", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.49023557723571776, "ground_truth": 0}, {"key": "16201033", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5851011814387287, "ground_truth": 0}, {"key": "16201033", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5888891298906415, "ground_truth": 0}, {"key": "16201033", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6057990488901073, "ground_truth": 0}, {"key": "16201033", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4941409018025759, "ground_truth": 0}, {"key": "16201033", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104788981788501, "ground_truth": 0}, {"key": "36469022", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6187804486650699, "ground_truth": 0}, {"key": "36469022", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5117165821586523, "ground_truth": 0}, {"key": "36469022", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.45326182276752647, "ground_truth": 0}, {"key": "36469022", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494717583428, "ground_truth": 0}, {"key": "36469022", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.48828340620699884, "ground_truth": 0}, {"key": "31295270", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.25386103946063193, "ground_truth": 0}, {"key": "31295270", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.25091278740944045, "ground_truth": 0}, {"key": "31295270", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2658804789971832, "ground_truth": 0}, {"key": "31295270", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.26133092631031546, "ground_truth": 0}, {"key": "31295270", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2043419179162053, "ground_truth": 0}, {"key": "35360689", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.461016788047235, "ground_truth": 0}, {"key": "35360689", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37022538415355466, "ground_truth": 0}, {"key": "35360689", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.25238403923925157, "ground_truth": 0}, {"key": "35360689", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256359593177, "ground_truth": 0}, {"key": "35360689", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.36296919844377185, "ground_truth": 0}, {"key": "29202793", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.42250465573310686, "ground_truth": 0}, {"key": "29202793", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3849121361734987, "ground_truth": 0}, {"key": "29202793", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5292633920392059, "ground_truth": 0}, {"key": "29202793", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4687906376699573, "ground_truth": 0}, {"key": "29202793", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.41489883658827453, "ground_truth": 0}, {"key": "35999008", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7201714945665836, "ground_truth": 0}, {"key": "35999008", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45519859968347043, "ground_truth": 0}, {"key": "35999008", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46879065050561736, "ground_truth": 0}, {"key": "35999008", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643977606261, "ground_truth": 0}, {"key": "35999008", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740028336413, "ground_truth": 0}, {"key": "31797119", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8164063935937825, "ground_truth": 0}, {"key": "31797119", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8615382065094138, "ground_truth": 0}, {"key": "31797119", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8539127489772058, "ground_truth": 0}, {"key": "31797119", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382154684103, "ground_truth": 0}, {"key": "31797119", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.842863148829274, "ground_truth": 0}, {"key": "26711893", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7620700990273256, "ground_truth": 0}, {"key": "26711893", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6001883660023705, "ground_truth": 0}, {"key": "26711893", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7505527556110995, "ground_truth": 0}, {"key": "26711893", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318277335267, "ground_truth": 0}, {"key": "26711893", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593233637191, "ground_truth": 0}, {"key": "35348288", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5175709222280743, "ground_truth": 0}, {"key": "35348288", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3665897525593249, "ground_truth": 0}, {"key": "35348288", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4148988458797351, "ground_truth": 0}, {"key": "35348288", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312094053243593, "ground_truth": 0}, {"key": "35348288", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118613668703, "ground_truth": 0}, {"key": "38124131", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4436004272362107, "ground_truth": 0}, {"key": "38124131", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.14608724869549672, "ground_truth": 0}, {"key": "38124131", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2200071163474496, "ground_truth": 0}, {"key": "38124131", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310537776638, "ground_truth": 0}, {"key": "38124131", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569733074249195, "ground_truth": 0}, {"key": "20285901", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6774740530033153, "ground_truth": 0}, {"key": "20285901", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7057850239375563, "ground_truth": 0}, {"key": "20285901", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.752012574969918, "ground_truth": 0}, {"key": "20285901", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983122260933809, "ground_truth": 0}, {"key": "20285901", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358721023299, "ground_truth": 0}, {"key": "35633632", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7461389965530879, "ground_truth": 0}, {"key": "35633632", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5679366143604963, "ground_truth": 0}, {"key": "35633632", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6279512249998778, "ground_truth": 0}, {"key": "35633632", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316808145896, "ground_truth": 0}, {"key": "35633632", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715209160056, "ground_truth": 0}, {"key": "10741274", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6132365438008253, "ground_truth": 0}, {"key": "10741274", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5506073670991536, "ground_truth": 0}, {"key": "10741274", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.39420095349254647, "ground_truth": 0}, {"key": "10741274", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2030746175166914, "ground_truth": 0}, {"key": "10741274", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881173048013, "ground_truth": 0}, {"key": "30605795", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6424324584709094, "ground_truth": 0}, {"key": "30605795", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7386690915014644, "ground_truth": 0}, {"key": "30605795", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5851011371515392, "ground_truth": 0}, {"key": "30605795", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300572260382, "ground_truth": 0}, {"key": "30605795", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891072815361, "ground_truth": 0}, {"key": "30539722", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.503906159935924, "ground_truth": 0}, {"key": "30539722", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3849121341612103, "ground_truth": 0}, {"key": "30539722", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5851011472600922, "ground_truth": 0}, {"key": "30539722", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253914819447, "ground_truth": 0}, {"key": "30539722", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185017228336, "ground_truth": 0}, {"key": "18639299", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.443600456892408, "ground_truth": 0}, {"key": "18639299", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3998116237730384, "ground_truth": 0}, {"key": "18639299", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3486451341997023, "ground_truth": 0}, {"key": "18639299", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2735743860109004, "ground_truth": 0}, {"key": "18639299", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3629692087160495, "ground_truth": 0}, {"key": "39773552", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8044059092855118, "ground_truth": 0}, {"key": "39773552", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6187804564108987, "ground_truth": 0}, {"key": "39773552", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.674050484891815, "ground_truth": 0}, {"key": "39773552", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633754894448, "ground_truth": 0}, {"key": "39773552", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637632684183, "ground_truth": 0}, {"key": "34086410", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5736783773790499, "ground_truth": 0}, {"key": "34086410", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4263215931389239, "ground_truth": 0}, {"key": "34086410", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42250461049113186, "ground_truth": 0}, {"key": "34086410", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.38306417693162914, "ground_truth": 0}, {"key": "34086410", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180588940857, "ground_truth": 0}, {"key": "35454652", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8311430473180352, "ground_truth": 0}, {"key": "35454652", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8925625278473253, "ground_truth": 0}, {"key": "35454652", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8661325120609544, "ground_truth": 0}, {"key": "35454652", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254122946677, "ground_truth": 0}, {"key": "35454652", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8661325101954114, "ground_truth": 0}, {"key": "36158310", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8333245845365239, "ground_truth": 0}, {"key": "36158310", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4359015270039291, "ground_truth": 0}, {"key": "36158310", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.925229962371438, "ground_truth": 0}, {"key": "36158310", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430423565588, "ground_truth": 0}, {"key": "36158310", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215313222941, "ground_truth": 0}, {"key": "35688387", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3328523491289148, "ground_truth": 0}, {"key": "35688387", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7446563389833423, "ground_truth": 0}, {"key": "35688387", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.20181321937103355, "ground_truth": 0}, {"key": "35688387", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.35756751187197744, "ground_truth": 0}, {"key": "35688387", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.39047584559765686, "ground_truth": 0}, {"key": "34209292", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.734119526486322, "ground_truth": 0}, {"key": "34209292", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.699254426247746, "ground_truth": 0}, {"key": "34209292", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7106283329226362, "ground_truth": 0}, {"key": "34209292", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759631268419, "ground_truth": 0}, {"key": "34209292", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592253878172862, "ground_truth": 0}, {"key": "25037859", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.46295862509666597, "ground_truth": 0}, {"key": "25037859", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.509764379848105, "ground_truth": 0}, {"key": "25037859", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7248702520605261, "ground_truth": 0}, {"key": "25037859", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358652703137, "ground_truth": 0}, {"key": "25037859", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3738758315554626, "ground_truth": 0}, {"key": "36412121", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9184802431282137, "ground_truth": 0}, {"key": "36412121", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8539127483390501, "ground_truth": 0}, {"key": "36412121", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.891811038597923, "ground_truth": 0}, {"key": "36412121", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583489655814, "ground_truth": 0}, {"key": "36412121", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549575372592, "ground_truth": 0}, {"key": "34909172", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.766293629763944, "ground_truth": 0}, {"key": "34909172", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8080672042953603, "ground_truth": 0}, {"key": "34909172", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8757869859256705, "ground_truth": 0}, {"key": "34909172", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215266926631, "ground_truth": 0}, {"key": "34909172", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.635222444721354, "ground_truth": 0}, {"key": "39011806", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7563575473621457, "ground_truth": 0}, {"key": "39011806", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8783142459961936, "ground_truth": 0}, {"key": "39011806", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8832359850163801, "ground_truth": 0}, {"key": "39011806", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797089677707, "ground_truth": 0}, {"key": "39011806", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8895288523978211, "ground_truth": 0}, {"key": "33096163", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7090191123573399, "ground_truth": 0}, {"key": "33096163", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8947894674935863, "ground_truth": 0}, {"key": "33096163", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8418256469913792, "ground_truth": 0}, {"key": "33096163", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797582263636, "ground_truth": 0}, {"key": "33096163", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321951659183, "ground_truth": 0}, {"key": "38762205", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8969755691168743, "ground_truth": 0}, {"key": "38762205", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9219218361318879, "ground_truth": 0}, {"key": "38762205", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8714748545991682, "ground_truth": 0}, {"key": "38762205", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9385759517255872, "ground_truth": 0}, {"key": "38762205", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372107941536482, "ground_truth": 0}, {"key": "35519177", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7446563340389969, "ground_truth": 0}, {"key": "35519177", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7185943953776895, "ground_truth": 0}, {"key": "35519177", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8344068898627132, "ground_truth": 0}, {"key": "35519177", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.882427862865441, "ground_truth": 0}, {"key": "35519177", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105584105736, "ground_truth": 0}, {"key": "36192531", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7371581545300775, "ground_truth": 0}, {"key": "36192531", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6206216235626016, "ground_truth": 0}, {"key": "36192531", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.598312190016065, "ground_truth": 0}, {"key": "36192531", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216315430623, "ground_truth": 0}, {"key": "36192531", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512764139057, "ground_truth": 0}, {"key": "33160852", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9453993961735364, "ground_truth": 0}, {"key": "33160852", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9358173562339228, "ground_truth": 0}, {"key": "33160852", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9600626838834286, "ground_truth": 0}, {"key": "33160852", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9872772928236453, "ground_truth": 0}, {"key": "33160852", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9678992909378753, "ground_truth": 0}, {"key": "36312304", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6370308158465319, "ground_truth": 0}, {"key": "36312304", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48438005753642066, "ground_truth": 0}, {"key": "36312304", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5794003892899607, "ground_truth": 0}, {"key": "36312304", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.49609384225079506, "ground_truth": 0}, {"key": "36312304", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.38306416489136075, "ground_truth": 0}, {"key": "33773343", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6859494802658495, "ground_truth": 0}, {"key": "33773343", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4130035942825449, "ground_truth": 0}, {"key": "33773343", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.558327004562623, "ground_truth": 0}, {"key": "33773343", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073674575855, "ground_truth": 0}, {"key": "33773343", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.40733343506749564, "ground_truth": 0}, {"key": "34913320", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.646013659550283, "ground_truth": 0}, {"key": "34913320", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5640984663629814, "ground_truth": 0}, {"key": "34913320", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5907792050808687, "ground_truth": 0}, {"key": "34913320", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601193450313, "ground_truth": 0}, {"key": "34913320", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918121610956, "ground_truth": 0}, {"key": "33784155", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.759225402342443, "ground_truth": 0}, {"key": "33784155", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8652240883052561, "ground_truth": 0}, {"key": "33784155", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5851011722922776, "ground_truth": 0}, {"key": "33784155", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195138789958, "ground_truth": 0}, {"key": "33784155", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504893210989, "ground_truth": 0}, {"key": "24085062", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9944450753246442, "ground_truth": 0}, {"key": "24085062", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9982247395117179, "ground_truth": 0}, {"key": "24085062", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9898303423846457, "ground_truth": 0}, {"key": "24085062", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9958660320957433, "ground_truth": 0}, {"key": "24085062", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9969721651759719, "ground_truth": 0}, {"key": "33893487", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3575675047792852, "ground_truth": 0}, {"key": "33893487", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1766716027073654, "ground_truth": 0}, {"key": "33893487", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3056973166602174, "ground_truth": 0}, {"key": "33893487", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.41300356904626423, "ground_truth": 0}, {"key": "33893487", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.364777533537916, "ground_truth": 0}, {"key": "40913011", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8489721903620105, "ground_truth": 0}, {"key": "40913011", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8407825959018153, "ground_truth": 0}, {"key": "40913011", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8757869987904247, "ground_truth": 0}, {"key": "40913011", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110318950423, "ground_truth": 0}, {"key": "40913011", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392777682959, "ground_truth": 0}, {"key": "29642545", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4416730165937268, "ground_truth": 0}, {"key": "29642545", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2751297298049212, "ground_truth": 0}, {"key": "29642545", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.31405053955736734, "ground_truth": 0}, {"key": "29642545", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.19930800957870817, "ground_truth": 0}, {"key": "29642545", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132651553991493, "ground_truth": 0}, {"key": "35969159", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7325918237192663, "ground_truth": 0}, {"key": "35969159", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8418256500042175, "ground_truth": 0}, {"key": "35969159", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.680878596372223, "ground_truth": 0}, {"key": "35969159", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240882542828, "ground_truth": 0}, {"key": "35969159", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846378581634, "ground_truth": 0}, {"key": "37081669", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3056973320988845, "ground_truth": 0}, {"key": "37081669", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4610167304972293, "ground_truth": 0}, {"key": "37081669", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.35756750117121977, "ground_truth": 0}, {"key": "37081669", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468813785602, "ground_truth": 0}, {"key": "37081669", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2829881074027388, "ground_truth": 0}, {"key": "40048022", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7592254100692445, "ground_truth": 0}, {"key": "40048022", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7853085932658359, "ground_truth": 0}, {"key": "40048022", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7592254102861993, "ground_truth": 0}, {"key": "40048022", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680321018346, "ground_truth": 0}, {"key": "40048022", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601526448517, "ground_truth": 0}, {"key": "32884004", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8469578404600834, "ground_truth": 0}, {"key": "32884004", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8697145875334065, "ground_truth": 0}, {"key": "32884004", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7217432081063375, "ground_truth": 0}, {"key": "32884004", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.763483769006917, "ground_truth": 0}, {"key": "32884004", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.827828152680533, "ground_truth": 0}, {"key": "39022490", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7549149633343298, "ground_truth": 0}, {"key": "39022490", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8895288393200707, "ground_truth": 0}, {"key": "39022490", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8568122982834339, "ground_truth": 0}, {"key": "39022490", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711798739323, "ground_truth": 0}, {"key": "39022490", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.844921530484865, "ground_truth": 0}, {"key": "35159385", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5964331288994787, "ground_truth": 0}, {"key": "35159385", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5869964397799018, "ground_truth": 0}, {"key": "35159385", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6513548855956488, "ground_truth": 0}, {"key": "35159385", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489722017127954, "ground_truth": 0}, {"key": "35159385", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673023589541, "ground_truth": 0}, {"key": "34363669", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.24798741880607778, "ground_truth": 0}, {"key": "34363669", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4551986027067904, "ground_truth": 0}, {"key": "34363669", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.33807712989900673, "ground_truth": 0}, {"key": "34363669", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199292392859, "ground_truth": 0}, {"key": "34363669", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510837870381684, "ground_truth": 0}, {"key": "36119687", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9600626870141012, "ground_truth": 0}, {"key": "36119687", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9005297891306568, "ground_truth": 0}, {"key": "36119687", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9235923233657688, "ground_truth": 0}, {"key": "36119687", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9671630444557806, "ground_truth": 0}, {"key": "36119687", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9252299637295752, "ground_truth": 0}, {"key": "35217446", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7799929073963658, "ground_truth": 0}, {"key": "35217446", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6688802783066613, "ground_truth": 0}, {"key": "35217446", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7813306352214128, "ground_truth": 0}, {"key": "35217446", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9184802342626373, "ground_truth": 0}, {"key": "35217446", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.873214817007267, "ground_truth": 0}, {"key": "39049331", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8558511513823918, "ground_truth": 0}, {"key": "39049331", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8080672019487973, "ground_truth": 0}, {"key": "39049331", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.774583402183358, "ground_truth": 0}, {"key": "39049331", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318148074193, "ground_truth": 0}, {"key": "39049331", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281474587802, "ground_truth": 0}, {"key": "36472242", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8116760159501573, "ground_truth": 0}, {"key": "36472242", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8068526266378101, "ground_truth": 0}, {"key": "36472242", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8140528002917681, "ground_truth": 0}, {"key": "36472242", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816148974417427, "ground_truth": 0}, {"key": "36472242", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867864513538, "ground_truth": 0}, {"key": "31854721", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8344068929633222, "ground_truth": 0}, {"key": "31854721", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6859494702404431, "ground_truth": 0}, {"key": "31854721", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7461390126490914, "ground_truth": 0}, {"key": "31854721", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.738669077710532, "ground_truth": 0}, {"key": "31854721", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203655424774, "ground_truth": 0}, {"key": "18725849", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4513265050324637, "ground_truth": 0}, {"key": "18725849", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.47657963990865876, "ground_truth": 0}, {"key": "18725849", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.41111087258462115, "ground_truth": 0}, {"key": "18725849", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.48633154876770696, "ground_truth": 0}, {"key": "18725849", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3849121533815451, "ground_truth": 0}, {"key": "36883179", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.21601151881018396, "ground_truth": 0}, {"key": "36883179", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3328523377840424, "ground_truth": 0}, {"key": "36883179", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.29421495890182875, "ground_truth": 0}, {"key": "36883179", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4649015882891964, "ground_truth": 0}, {"key": "36883179", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510837517907696, "ground_truth": 0}, {"key": "34266359", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7341195307948187, "ground_truth": 0}, {"key": "34266359", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8344068854937273, "ground_truth": 0}, {"key": "34266359", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.839733971807402, "ground_truth": 0}, {"key": "34266359", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690639441876, "ground_truth": 0}, {"key": "34266359", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680101865534, "ground_truth": 0}, {"key": "31920289", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5869964092551523, "ground_truth": 0}, {"key": "31920289", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5794003975332704, "ground_truth": 0}, {"key": "31920289", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5117165957499482, "ground_truth": 0}, {"key": "31920289", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570646153211606, "ground_truth": 0}, {"key": "31920289", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476690086217, "ground_truth": 0}, {"key": "36292997", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6352224526388678, "ground_truth": 0}, {"key": "36292997", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7662936471943563, "ground_truth": 0}, {"key": "36292997", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6150878551669808, "ground_truth": 0}, {"key": "36292997", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358292992516, "ground_truth": 0}, {"key": "36292997", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526171599424, "ground_truth": 0}, {"key": "30412533", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9252299539439512, "ground_truth": 0}, {"key": "30412533", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6169358201238243, "ground_truth": 0}, {"key": "30412533", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7704647910821184, "ground_truth": 0}, {"key": "30412533", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191348061053, "ground_truth": 0}, {"key": "30412533", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998672301205, "ground_truth": 0}, {"key": "40433191", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9637799441077431, "ground_truth": 0}, {"key": "40433191", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9462003599983974, "ground_truth": 0}, {"key": "40433191", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.940789748545467, "ground_truth": 0}, {"key": "40433191", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.944994710357074, "ground_truth": 0}, {"key": "40433191", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9492946319090764, "ground_truth": 0}, {"key": "34565591", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2974699223436949, "ground_truth": 0}, {"key": "34565591", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3276682909424659, "ground_truth": 0}, {"key": "34565591", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.47852881991703405, "ground_truth": 0}, {"key": "34565591", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651624157110004, "ground_truth": 0}, {"key": "34565591", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4687906296255477, "ground_truth": 0}, {"key": "36062480", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8529354851120416, "ground_truth": 0}, {"key": "36062480", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8807970747137089, "ground_truth": 0}, {"key": "36062480", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9496693676730154, "ground_truth": 0}, {"key": "36062480", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9403530533561834, "ground_truth": 0}, {"key": "36062480", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825889334231, "ground_truth": 0}, {"key": "37276883", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6859494845377797, "ground_truth": 0}, {"key": "37276883", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6926419794647133, "ground_truth": 0}, {"key": "37276883", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8606036189753679, "ground_truth": 0}, {"key": "37276883", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737888105958, "ground_truth": 0}, {"key": "37276883", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506682193734, "ground_truth": 0}, {"key": "38509260", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7057850367914061, "ground_truth": 0}, {"key": "38509260", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7264256023280921, "ground_truth": 0}, {"key": "38509260", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6636689596856188, "ground_truth": 0}, {"key": "38509260", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581773100163, "ground_truth": 0}, {"key": "38509260", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352676687855, "ground_truth": 0}, {"key": "37139607", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8799743740803434, "ground_truth": 0}, {"key": "37139607", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8918110551460049, "ground_truth": 0}, {"key": "37139607", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8895288473698522, "ground_truth": 0}, {"key": "37139607", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325163624256, "ground_truth": 0}, {"key": "37139607", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.896251380819509, "ground_truth": 0}, {"key": "37092824", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9099070170770128, "ground_truth": 0}, {"key": "37092824", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9207896795344294, "ground_truth": 0}, {"key": "37092824", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9676556691591212, "ground_truth": 0}, {"key": "37092824", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213884954328, "ground_truth": 0}, {"key": "37092824", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998565874085, "ground_truth": 0}, {"key": "32191802", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9372107938232225, "ground_truth": 0}, {"key": "32191802", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7476159547947482, "ground_truth": 0}, {"key": "32191802", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9465966700242647, "ground_truth": 0}, {"key": "32191802", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9026096024805181, "ground_truth": 0}, {"key": "32191802", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9257686219062856, "ground_truth": 0}, {"key": "39396038", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9549844670993691, "ground_truth": 0}, {"key": "39396038", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9559813480849415, "ground_truth": 0}, {"key": "39396038", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.963506235520956, "ground_truth": 0}, {"key": "39396038", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9597620559233943, "ground_truth": 0}, {"key": "39396038", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.949294631321441, "ground_truth": 0}, {"key": "39076884", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6548947332096019, "ground_truth": 0}, {"key": "39076884", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8104788924046116, "ground_truth": 0}, {"key": "39076884", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6548947266493731, "ground_truth": 0}, {"key": "39076884", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331450095453, "ground_truth": 0}, {"key": "39076884", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321844611076, "ground_truth": 0}, {"key": "27763432", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.39981167442580245, "ground_truth": 0}, {"key": "27763432", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.44939264886489494, "ground_truth": 0}, {"key": "27763432", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.34334176106169756, "ground_truth": 0}, {"key": "27763432", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.43590151891281653, "ground_truth": 0}, {"key": "27763432", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213096049925, "ground_truth": 0}, {"key": "37806929", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8568122914557249, "ground_truth": 0}, {"key": "37806929", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8539127499383441, "ground_truth": 0}, {"key": "37806929", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8933094005975475, "ground_truth": 0}, {"key": "37806929", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059231979264, "ground_truth": 0}, {"key": "37806929", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8976952951511068, "ground_truth": 0}, {"key": "32334186", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8210441155392557, "ground_truth": 0}, {"key": "32334186", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8244619345822601, "ground_truth": 0}, {"key": "32334186", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6619228628109606, "ground_truth": 0}, {"key": "32334186", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283900594943, "ground_truth": 0}, {"key": "32334186", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215218576809, "ground_truth": 0}, {"key": "36187324", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7170118946255288, "ground_truth": 0}, {"key": "36187324", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.874934619661898, "ground_truth": 0}, {"key": "36187324", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6654105583565483, "ground_truth": 0}, {"key": "36187324", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233284168698295, "ground_truth": 0}, {"key": "36187324", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277788468996, "ground_truth": 0}, {"key": "35306009", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9525741269133076, "ground_truth": 0}, {"key": "35306009", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9591542866245988, "ground_truth": 0}, {"key": "35306009", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9726235108374425, "ground_truth": 0}, {"key": "35306009", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9674102560652509, "ground_truth": 0}, {"key": "35306009", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9690910421702061, "ground_truth": 0}, {"key": "39490050", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.214691415877139, "ground_truth": 0}, {"key": "39490050", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3174262856274971, "ground_truth": 0}, {"key": "39490050", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.38491216713654747, "ground_truth": 0}, {"key": "39490050", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4205996056840315, "ground_truth": 0}, {"key": "39490050", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.19314737705703283, "ground_truth": 0}, {"key": "38072149", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6057990650961766, "ground_truth": 0}, {"key": "38072149", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5640984955809357, "ground_truth": 0}, {"key": "38072149", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6352224338295945, "ground_truth": 0}, {"key": "38072149", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315943186825962, "ground_truth": 0}, {"key": "38072149", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615846225168, "ground_truth": 0}, {"key": "35899689", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7106283148653003, "ground_truth": 0}, {"key": "35899689", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.42059959368141403, "ground_truth": 0}, {"key": "35899689", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6774740325946633, "ground_truth": 0}, {"key": "35899689", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.68594944519152, "ground_truth": 0}, {"key": "35899689", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317114561984, "ground_truth": 0}, {"key": "27994518", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6808786052320902, "ground_truth": 0}, {"key": "27994518", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5506073801503978, "ground_truth": 0}, {"key": "27994518", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7732163660966729, "ground_truth": 0}, {"key": "27994518", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601611875462, "ground_truth": 0}, {"key": "27994518", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476810441592, "ground_truth": 0}, {"key": "10615479", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.19682621243576107, "ground_truth": 0}, {"key": "10615479", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1059482791834797, "ground_truth": 0}, {"key": "10615479", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3090237035079271, "ground_truth": 0}, {"key": "10615479", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.1859472049689441, "ground_truth": 0}, {"key": "10615479", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.11596071765384677, "ground_truth": 0}, {"key": "40186667", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9079671450297672, "ground_truth": 0}, {"key": "40186667", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5851011316254721, "ground_truth": 0}, {"key": "40186667", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.752012578752797, "ground_truth": 0}, {"key": "40186667", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424477734959, "ground_truth": 0}, {"key": "40186667", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583270169788542, "ground_truth": 0}, {"key": "38622886", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6095241444296963, "ground_truth": 0}, {"key": "38622886", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48242912105906616, "ground_truth": 0}, {"key": "38622886", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7759445618110995, "ground_truth": 0}, {"key": "38622886", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789209527962, "ground_truth": 0}, {"key": "38622886", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575573139114, "ground_truth": 0}, {"key": "40686943", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8633916025488212, "ground_truth": 0}, {"key": "40686943", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8140528094314688, "ground_truth": 0}, {"key": "40686943", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8198933237942977, "ground_truth": 0}, {"key": "40686943", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357654572982, "ground_truth": 0}, {"key": "40686943", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489721932161938, "ground_truth": 0}, {"key": "30604567", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.978051744809855, "ground_truth": 0}, {"key": "30604567", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9390248185618277, "ground_truth": 0}, {"key": "30604567", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9178933773913797, "ground_truth": 0}, {"key": "30604567", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923185449837, "ground_truth": 0}, {"key": "30604567", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9167080734999402, "ground_truth": 0}, {"key": "35440903", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7563575870183167, "ground_truth": 0}, {"key": "35440903", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6859494565973417, "ground_truth": 0}, {"key": "35440903", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8344068980574897, "ground_truth": 0}, {"key": "35440903", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918275373633, "ground_truth": 0}, {"key": "35440903", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333246009216859, "ground_truth": 0}, {"key": "37219533", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.32594953899318263, "ground_truth": 0}, {"key": "37219533", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6315942842626178, "ground_truth": 0}, {"key": "37219533", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.579400410378406, "ground_truth": 0}, {"key": "37219533", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.30902371056912353, "ground_truth": 0}, {"key": "37219533", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.39606814444926014, "ground_truth": 0}, {"key": "40178965", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7943849662402676, "ground_truth": 0}, {"key": "40178965", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8267117947549314, "ground_truth": 0}, {"key": "40178965", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8824278601549601, "ground_truth": 0}, {"key": "40178965", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9309620698152078, "ground_truth": 0}, {"key": "40178965", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277836513505, "ground_truth": 0}, {"key": "13750468", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5851011463267776, "ground_truth": 0}, {"key": "13750468", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6531269092855765, "ground_truth": 0}, {"key": "13750468", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5755880245315015, "ground_truth": 0}, {"key": "13750468", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849648141456, "ground_truth": 0}, {"key": "13750468", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.566018490436493, "ground_truth": 0}, {"key": "17754949", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7634837855723, "ground_truth": 0}, {"key": "17754949", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5117165996586669, "ground_truth": 0}, {"key": "17754949", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7201715150121034, "ground_truth": 0}, {"key": "17754949", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.713830757673817, "ground_truth": 0}, {"key": "17754949", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267118059872629, "ground_truth": 0}, {"key": "36675623", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9556514142748709, "ground_truth": 0}, {"key": "36675623", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9563089370373622, "ground_truth": 0}, {"key": "36675623", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9481545306180276, "ground_truth": 0}, {"key": "36675623", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037212611369, "ground_truth": 0}, {"key": "36675623", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9481545311980933, "ground_truth": 0}, {"key": "40035440", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9903663485520467, "ground_truth": 0}, {"key": "40035440", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9853843317753668, "ground_truth": 0}, {"key": "40035440", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9376689594017622, "ground_truth": 0}, {"key": "40035440", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.962952827524828, "ground_truth": 0}, {"key": "40035440", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.977883413362521, "ground_truth": 0}, {"key": "37685909", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3123699941093423, "ground_truth": 0}, {"key": "37685909", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.20181322303239238, "ground_truth": 0}, {"key": "37685909", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.20434190599250163, "ground_truth": 0}, {"key": "37685909", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33458946400197853, "ground_truth": 0}, {"key": "37685909", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2598256467720917, "ground_truth": 0}, {"key": "36938787", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9213576125658892, "ground_truth": 0}, {"key": "36938787", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9294404084471224, "ground_truth": 0}, {"key": "36938787", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8164063840978124, "ground_truth": 0}, {"key": "36938787", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.806852633534116, "ground_truth": 0}, {"key": "36938787", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424342281682, "ground_truth": 0}, {"key": "39398068", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4668455726573253, "ground_truth": 0}, {"key": "39398068", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.33111976121871006, "ground_truth": 0}, {"key": "39398068", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6460136832132387, "ground_truth": 0}, {"key": "39398068", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.494140876339433, "ground_truth": 0}, {"key": "39398068", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061675760552, "ground_truth": 0}, {"key": "39926408", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.30569731593810096, "ground_truth": 0}, {"key": "39926408", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6388352672497545, "ground_truth": 0}, {"key": "39926408", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.48438009334877685, "ground_truth": 0}, {"key": "39926408", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023562265372733, "ground_truth": 0}, {"key": "39926408", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990617531814, "ground_truth": 0}, {"key": "40465336", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6601724066820701, "ground_truth": 0}, {"key": "40465336", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6057990536534724, "ground_truth": 0}, {"key": "40465336", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5945512680026351, "ground_truth": 0}, {"key": "40465336", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737249174453, "ground_truth": 0}, {"key": "40465336", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876300161556251, "ground_truth": 0}, {"key": "34173549", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8615382022398779, "ground_truth": 0}, {"key": "34173549", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7943849561780999, "ground_truth": 0}, {"key": "34173549", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8449215381759876, "ground_truth": 0}, {"key": "34173549", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.812867303558629, "ground_truth": 0}, {"key": "34173549", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068976805518, "ground_truth": 0}, {"key": "33541535", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.770464787574052, "ground_truth": 0}, {"key": "33541535", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5428632756383727, "ground_truth": 0}, {"key": "33541535", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7295198038555274, "ground_truth": 0}, {"key": "33541535", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743655372562, "ground_truth": 0}, {"key": "33541535", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094728419098, "ground_truth": 0}, {"key": "35685195", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7759445599182379, "ground_truth": 0}, {"key": "35685195", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5945512684769392, "ground_truth": 0}, {"key": "35685195", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.685949454910876, "ground_truth": 0}, {"key": "35685195", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224772310022, "ground_truth": 0}, {"key": "35685195", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.577495367072359, "ground_truth": 0}, {"key": "28440730", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.24653333053995707, "ground_truth": 0}, {"key": "28440730", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.42250463679096195, "ground_truth": 0}, {"key": "28440730", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4513265032341153, "ground_truth": 0}, {"key": "28440730", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.38861801951604635, "ground_truth": 0}, {"key": "28440730", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1980641864608303, "ground_truth": 0}, {"key": "38338714", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9155072455966334, "ground_truth": 0}, {"key": "38338714", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8947894641047615, "ground_truth": 0}, {"key": "38338714", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8947894637330196, "ground_truth": 0}, {"key": "38338714", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.947769147439733, "ground_truth": 0}, {"key": "38338714", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9433475741569621, "ground_truth": 0}, {"key": "32191881", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.32939172294847224, "ground_truth": 0}, {"key": "32191881", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2133771630770968, "ground_truth": 0}, {"key": "32191881", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.33807713573111975, "ground_truth": 0}, {"key": "32191881", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.19559408164304318, "ground_truth": 0}, {"key": "32191881", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2068940573427241, "ground_truth": 0}, {"key": "37707251", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5467381493889204, "ground_truth": 0}, {"key": "37707251", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6671476718385179, "ground_truth": 0}, {"key": "37707251", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8152324844182175, "ground_truth": 0}, {"key": "37707251", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.753466661404763, "ground_truth": 0}, {"key": "37707251", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352845284814, "ground_truth": 0}, {"key": "40172567", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3191213765747175, "ground_truth": 0}, {"key": "40172567", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41679668397065905, "ground_truth": 0}, {"key": "40172567", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4205996014768207, "ground_truth": 0}, {"key": "40172567", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591101685188, "ground_truth": 0}, {"key": "40172567", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.492188120249112, "ground_truth": 0}, {"key": "33113255", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8267118057835989, "ground_truth": 0}, {"key": "33113255", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.818736778630861, "ground_truth": 0}, {"key": "33113255", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7786493233972177, "ground_truth": 0}, {"key": "33113255", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701136246353, "ground_truth": 0}, {"key": "33113255", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891429263974, "ground_truth": 0}, {"key": "33022143", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6113819817197904, "ground_truth": 0}, {"key": "33022143", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.40922078931940103, "ground_truth": 0}, {"key": "33022143", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.24944723191062923, "ground_truth": 0}, {"key": "33022143", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3208212999925284, "ground_truth": 0}, {"key": "33022143", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117166260689123, "ground_truth": 0}, {"key": "32084473", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9390248267510036, "ground_truth": 0}, {"key": "32084473", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9412234369088813, "ground_truth": 0}, {"key": "32084473", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9416541518553975, "ground_truth": 0}, {"key": "32084473", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9167080710563476, "ground_truth": 0}, {"key": "32084473", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9289263236521429, "ground_truth": 0}, {"key": "40564245", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.39047584585951356, "ground_truth": 0}, {"key": "40564245", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.668880282373813, "ground_truth": 0}, {"key": "40564245", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7704647767664129, "ground_truth": 0}, {"key": "40564245", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448014017957311, "ground_truth": 0}, {"key": "40564245", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.615087846040049, "ground_truth": 0}, {"key": "31717213", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.781330625330977, "ground_truth": 0}, {"key": "31717213", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6261241794927346, "ground_truth": 0}, {"key": "31717213", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8289388188549591, "ground_truth": 0}, {"key": "31717213", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.644225080238725, "ground_truth": 0}, {"key": "31717213", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526090610157, "ground_truth": 0}, {"key": "34861894", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6424324601108743, "ground_truth": 0}, {"key": "34861894", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7154239854499453, "ground_truth": 0}, {"key": "34861894", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5774953472039102, "ground_truth": 0}, {"key": "34861894", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.615087856408524, "ground_truth": 0}, {"key": "34861894", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.707404730316676, "ground_truth": 0}, {"key": "40838760", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8697145702368643, "ground_truth": 0}, {"key": "40838760", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9026096027703856, "ground_truth": 0}, {"key": "40838760", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7772998491606368, "ground_truth": 0}, {"key": "40838760", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352645010114, "ground_truth": 0}, {"key": "40838760", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677539744627, "ground_truth": 0}, {"key": "40044849", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7892337013679547, "ground_truth": 0}, {"key": "40044849", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6261241705770766, "ground_truth": 0}, {"key": "40044849", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7676898417609245, "ground_truth": 0}, {"key": "40044849", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711636371545, "ground_truth": 0}, {"key": "40044849", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352452099744, "ground_truth": 0}, {"key": "30296116", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.30074556495430393, "ground_truth": 0}, {"key": "30296116", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5370413791946765, "ground_truth": 0}, {"key": "30296116", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6020615817322781, "ground_truth": 0}, {"key": "30296116", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593456933942, "ground_truth": 0}, {"key": "30296116", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378234977042622, "ground_truth": 0}, {"key": "34931360", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.692642004535018, "ground_truth": 0}, {"key": "34931360", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5698526417959798, "ground_truth": 0}, {"key": "34931360", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6671476830470476, "ground_truth": 0}, {"key": "34931360", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582689343625, "ground_truth": 0}, {"key": "34931360", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935446460792, "ground_truth": 0}, {"key": "18862422", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5964331707872981, "ground_truth": 0}, {"key": "18862422", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8333246116099063, "ground_truth": 0}, {"key": "18862422", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5525397144636066, "ground_truth": 0}, {"key": "18862422", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269864985642, "ground_truth": 0}, {"key": "18862422", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.747615945140488, "ground_truth": 0}, {"key": "36361140", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9294404040814627, "ground_truth": 0}, {"key": "36361140", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9019206778861191, "ground_truth": 0}, {"key": "36361140", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9219218390162053, "ground_truth": 0}, {"key": "36361140", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9465966662734112, "ground_truth": 0}, {"key": "36361140", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.901227408949022, "ground_truth": 0}, {"key": "39703329", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.355774876147297, "ground_truth": 0}, {"key": "39703329", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.33982761832684316, "ground_truth": 0}, {"key": "39703329", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.30404168278468124, "ground_truth": 0}, {"key": "39703329", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.22270014332694452, "ground_truth": 0}, {"key": "39703329", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4167966589020605, "ground_truth": 0}, {"key": "34033324", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9299510357926016, "ground_truth": 0}, {"key": "34033324", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8955226727771252, "ground_truth": 0}, {"key": "34033324", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7170118824407491, "ground_truth": 0}, {"key": "34033324", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.953621794662288, "ground_truth": 0}, {"key": "34033324", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9196425276427278, "ground_truth": 0}, {"key": "35658862", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7866228215149601, "ground_truth": 0}, {"key": "35658862", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9304582651158373, "ground_truth": 0}, {"key": "35658862", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8344068907624262, "ground_truth": 0}, {"key": "35658862", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592253922913684, "ground_truth": 0}, {"key": "35658862", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702984370831, "ground_truth": 0}, {"key": "36092657", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.670608260198377, "ground_truth": 0}, {"key": "36092657", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8479677548827211, "ground_truth": 0}, {"key": "36092657", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7577943875020958, "ground_truth": 0}, {"key": "36092657", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918261077928, "ground_truth": 0}, {"key": "36092657", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680123711778, "ground_truth": 0}, {"key": "26333438", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "26333438", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5851011428958383, "ground_truth": 0}, {"key": "26333438", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5869964302975774, "ground_truth": 0}, {"key": "26333438", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324741615641, "ground_truth": 0}, {"key": "26333438", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311910703938, "ground_truth": 0}, {"key": "34184963", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4148988551489136, "ground_truth": 0}, {"key": "34184963", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5253688274978089, "ground_truth": 0}, {"key": "34184963", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.30902372910605086, "ground_truth": 0}, {"key": "34184963", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370414086293942, "ground_truth": 0}, {"key": "34184963", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3023910831317617, "ground_truth": 0}, {"key": "35069975", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5350984113849901, "ground_truth": 0}, {"key": "35069975", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.501953111004587, "ground_truth": 0}, {"key": "35069975", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6424324745030798, "ground_truth": 0}, {"key": "35069975", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4186969084678006, "ground_truth": 0}, {"key": "35069975", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878559246888, "ground_truth": 0}, {"key": "36443950", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5136684640248361, "ground_truth": 0}, {"key": "36443950", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.36840568563218423, "ground_truth": 0}, {"key": "36443950", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.35936413903701375, "ground_truth": 0}, {"key": "36443950", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4436004099070087, "ground_truth": 0}, {"key": "36443950", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121957994914407, "ground_truth": 0}, {"key": "29460858", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.28776783853758886, "ground_truth": 0}, {"key": "29460858", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2658804731403526, "ground_truth": 0}, {"key": "29460858", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.307358034971655, "ground_truth": 0}, {"key": "29460858", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34510525518386553, "ground_truth": 0}, {"key": "29460858", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939263610357216, "ground_truth": 0}, {"key": "36155704", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5175708708622481, "ground_truth": 0}, {"key": "36155704", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22815648388766072, "ground_truth": 0}, {"key": "36155704", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3757064531242515, "ground_truth": 0}, {"key": "36155704", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2735743892386275, "ground_truth": 0}, {"key": "36155704", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2465333278734118, "ground_truth": 0}, {"key": "37185211", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.833324601910339, "ground_truth": 0}, {"key": "37185211", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8031737910501037, "ground_truth": 0}, {"key": "37185211", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8092759753414538, "ground_truth": 0}, {"key": "37185211", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772393574009, "ground_truth": 0}, {"key": "37185211", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.899121380940104, "ground_truth": 0}, {"key": "36454885", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6601724101020615, "ground_truth": 0}, {"key": "36454885", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5794003830998533, "ground_truth": 0}, {"key": "36454885", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4320633969508271, "ground_truth": 0}, {"key": "36454885", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.613236560604586, "ground_truth": 0}, {"key": "36454885", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307535233291, "ground_truth": 0}, {"key": "33148906", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.44552952377973315, "ground_truth": 0}, {"key": "33148906", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1755380577254813, "ground_truth": 0}, {"key": "33148906", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2942149662290452, "ground_truth": 0}, {"key": "33148906", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.36296919589235266, "ground_truth": 0}, {"key": "33148906", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2751297230162266, "ground_truth": 0}, {"key": "18086604", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.29746995969662626, "ground_truth": 0}, {"key": "18086604", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5058591191283055, "ground_truth": 0}, {"key": "18086604", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.19930800734749116, "ground_truth": 0}, {"key": "18086604", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.214691416194383, "ground_truth": 0}, {"key": "18086604", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.26284184524141246, "ground_truth": 0}, {"key": "33693397", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7248702844051799, "ground_truth": 0}, {"key": "33693397", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7476159450894598, "ground_truth": 0}, {"key": "33693397", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7866228052895926, "ground_truth": 0}, {"key": "33693397", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080671861670502, "ground_truth": 0}, {"key": "33693397", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121826063071, "ground_truth": 0}, {"key": "39501530", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.36477752349258236, "ground_truth": 0}, {"key": "39501530", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3665897582935255, "ground_truth": 0}, {"key": "39501530", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3738758144498139, "ground_truth": 0}, {"key": "39501530", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3242353937151341, "ground_truth": 0}, {"key": "39501530", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3174262482540312, "ground_truth": 0}, {"key": "30948874", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8840392876096311, "ground_truth": 0}, {"key": "30948874", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7563575816689094, "ground_truth": 0}, {"key": "30948874", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8791467571298651, "ground_truth": 0}, {"key": "30948874", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.93487245079148, "ground_truth": 0}, {"key": "30948874", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681103100938, "ground_truth": 0}, {"key": "39410675", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8449215235193843, "ground_truth": 0}, {"key": "39410675", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7648916012730277, "ground_truth": 0}, {"key": "39410675", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7201714951533978, "ground_truth": 0}, {"key": "39410675", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9059898256068467, "ground_truth": 0}, {"key": "39410675", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545652342491, "ground_truth": 0}, {"key": "32903337", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4320633853101653, "ground_truth": 0}, {"key": "32903337", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.31742625305824596, "ground_truth": 0}, {"key": "32903337", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5292633707329433, "ground_truth": 0}, {"key": "32903337", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804523755726, "ground_truth": 0}, {"key": "32903337", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897304557241, "ground_truth": 0}, {"key": "27685132", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6132365277030091, "ground_truth": 0}, {"key": "27685132", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238779823564, "ground_truth": 0}, {"key": "27685132", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4882833781970819, "ground_truth": 0}, {"key": "27685132", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723744340512, "ground_truth": 0}, {"key": "27685132", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3522017605300461, "ground_truth": 0}, {"key": "22791471", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5813031265613833, "ground_truth": 0}, {"key": "22791471", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6424324798497867, "ground_truth": 0}, {"key": "22791471", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8418256282163467, "ground_truth": 0}, {"key": "22791471", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.71383074002486, "ground_truth": 0}, {"key": "22791471", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241697542036, "ground_truth": 0}, {"key": "32292348", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.795658105115675, "ground_truth": 0}, {"key": "32292348", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6791786935246458, "ground_truth": 0}, {"key": "32292348", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7620701055341642, "ground_truth": 0}, {"key": "32292348", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759916584991, "ground_truth": 0}, {"key": "32292348", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494166115292, "ground_truth": 0}, {"key": "20482930", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5234203748122194, "ground_truth": 0}, {"key": "20482930", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6132365495809584, "ground_truth": 0}, {"key": "20482930", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.647798247587656, "ground_truth": 0}, {"key": "20482930", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307820641548, "ground_truth": 0}, {"key": "20482930", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121778247816, "ground_truth": 0}, {"key": "11635754", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7264256244968962, "ground_truth": 0}, {"key": "11635754", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5350984358604732, "ground_truth": 0}, {"key": "11635754", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7490871980226399, "ground_truth": 0}, {"key": "11635754", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511454229853, "ground_truth": 0}, {"key": "11635754", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185944019561769, "ground_truth": 0}, {"key": "40029096", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.638835296413708, "ground_truth": 0}, {"key": "40029096", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7122321972644206, "ground_truth": 0}, {"key": "40029096", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5964331399329733, "ground_truth": 0}, {"key": "40029096", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711829531254, "ground_truth": 0}, {"key": "40029096", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094705789552, "ground_truth": 0}, {"key": "40414719", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9693241989953646, "ground_truth": 0}, {"key": "40414719", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9536217934177937, "ground_truth": 0}, {"key": "40414719", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9394706117185377, "ground_truth": 0}, {"key": "40414719", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9445872035934366, "ground_truth": 0}, {"key": "40414719", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9511422225480556, "ground_truth": 0}, {"key": "39537616", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7217432054808965, "ground_truth": 0}, {"key": "39537616", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8489722178001242, "ground_truth": 0}, {"key": "39537616", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6406358479977917, "ground_truth": 0}, {"key": "39537616", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239938178241, "ground_truth": 0}, {"key": "39537616", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743661224195, "ground_truth": 0}, {"key": "33245830", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.21469141125793337, "ground_truth": 0}, {"key": "33245830", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.26740816487509605, "ground_truth": 0}, {"key": "33245830", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.22270014076204797, "ground_truth": 0}, {"key": "33245830", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.15507847139783398, "ground_truth": 0}, {"key": "33245830", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2814055975260626, "ground_truth": 0}, {"key": "39243601", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7505527630277474, "ground_truth": 0}, {"key": "39243601", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5097644092304398, "ground_truth": 0}, {"key": "39243601", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6859494467467285, "ground_truth": 0}, {"key": "39243601", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883625928275, "ground_truth": 0}, {"key": "39243601", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195073474693, "ground_truth": 0}, {"key": "35815905", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4111108551104456, "ground_truth": 0}, {"key": "35815905", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5350984217155326, "ground_truth": 0}, {"key": "35815905", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2213506886155715, "ground_truth": 0}, {"key": "35815905", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734874193744, "ground_truth": 0}, {"key": "35815905", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.45326186775102656, "ground_truth": 0}, {"key": "35260212", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7704647867354408, "ground_truth": 0}, {"key": "35260212", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7008948136329608, "ground_truth": 0}, {"key": "35260212", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7505527698805572, "ground_truth": 0}, {"key": "35260212", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117867424657, "ground_truth": 0}, {"key": "35260212", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197911491977, "ground_truth": 0}, {"key": "39193924", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3684057377843711, "ground_truth": 0}, {"key": "39193924", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4882833764994953, "ground_truth": 0}, {"key": "39193924", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.388618046691933, "ground_truth": 0}, {"key": "39193924", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011666139027, "ground_truth": 0}, {"key": "39193924", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4532618203166146, "ground_truth": 0}, {"key": "40658569", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.23651622674681722, "ground_truth": 0}, {"key": "40658569", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4687906187967557, "ground_truth": 0}, {"key": "40658569", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5794004189519102, "ground_truth": 0}, {"key": "40658569", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.28298812305516446, "ground_truth": 0}, {"key": "40658569", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4513265351245806, "ground_truth": 0}, {"key": "33497596", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7981867752204448, "ground_truth": 0}, {"key": "33497596", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7534666677988149, "ground_truth": 0}, {"key": "33497596", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.744656372735653, "ground_truth": 0}, {"key": "33497596", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575709395192, "ground_truth": 0}, {"key": "33497596", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430543920404, "ground_truth": 0}, {"key": "40339241", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.675764612254269, "ground_truth": 0}, {"key": "40339241", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7943849482661196, "ground_truth": 0}, {"key": "40339241", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6825737509862654, "ground_truth": 0}, {"key": "40339241", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.774583381108147, "ground_truth": 0}, {"key": "40339241", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982312975337, "ground_truth": 0}, {"key": "31792608", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6992544113395046, "ground_truth": 0}, {"key": "31792608", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7154239942819052, "ground_truth": 0}, {"key": "31792608", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6297746305809439, "ground_truth": 0}, {"key": "31792608", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666527584688, "ground_truth": 0}, {"key": "31792608", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.680878616177632, "ground_truth": 0}, {"key": "33132662", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5621765145791563, "ground_truth": 0}, {"key": "33132662", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.847967758655016, "ground_truth": 0}, {"key": "33132662", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.44939264957975417, "ground_truth": 0}, {"key": "33132662", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872370588667, "ground_truth": 0}, {"key": "33132662", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891455561501, "ground_truth": 0}, {"key": "37577457", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5292634009479379, "ground_truth": 0}, {"key": "37577457", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3960681459816613, "ground_truth": 0}, {"key": "37577457", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.60952415015782, "ground_truth": 0}, {"key": "37577457", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640527209354, "ground_truth": 0}, {"key": "37577457", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156198973222214, "ground_truth": 0}, {"key": "38701278", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7634837624859022, "ground_truth": 0}, {"key": "38701278", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8438950983600603, "ground_truth": 0}, {"key": "38701278", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9348724542835053, "ground_truth": 0}, {"key": "38701278", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201714933800828, "ground_truth": 0}, {"key": "38701278", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437685195774, "ground_truth": 0}, {"key": "34570783", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9184802446296604, "ground_truth": 0}, {"key": "34570783", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.831143033028873, "ground_truth": 0}, {"key": "34570783", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8976952902214328, "ground_truth": 0}, {"key": "34570783", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673212946343, "ground_truth": 0}, {"key": "34570783", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511453432517, "ground_truth": 0}, {"key": "39064526", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8344069031106717, "ground_truth": 0}, {"key": "39064526", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7106283079662931, "ground_truth": 0}, {"key": "39064526", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8344069029958203, "ground_truth": 0}, {"key": "39064526", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563377317685, "ground_truth": 0}, {"key": "39064526", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850139589952, "ground_truth": 0}, {"key": "40741545", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7090191238723031, "ground_truth": 0}, {"key": "40741545", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7446563336154521, "ground_truth": 0}, {"key": "40741545", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8344068818922651, "ground_truth": 0}, {"key": "40741545", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358328338981, "ground_truth": 0}, {"key": "40741545", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432053259744, "ground_truth": 0}, {"key": "36929751", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9609517109308422, "ground_truth": 0}, {"key": "36929751", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9445872042672148, "ground_truth": 0}, {"key": "36929751", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9603611579301154, "ground_truth": 0}, {"key": "36929751", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.965119110735826, "ground_truth": 0}, {"key": "36929751", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9507778852894823, "ground_truth": 0}, {"key": "23984730", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3056973167982796, "ground_truth": 0}, {"key": "23984730", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.18126320712830155, "ground_truth": 0}, {"key": "23984730", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2643583759750383, "ground_truth": 0}, {"key": "23984730", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.23231014983365664, "ground_truth": 0}, {"key": "23984730", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2704802177938862, "ground_truth": 0}, {"key": "36007415", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.884039279955637, "ground_truth": 0}, {"key": "36007415", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9588471113886987, "ground_truth": 0}, {"key": "36007415", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9273632911995194, "ground_truth": 0}, {"key": "36007415", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9039745088781069, "ground_truth": 0}, {"key": "36007415", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9319595753146473, "ground_truth": 0}, {"key": "38875041", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7248702676321477, "ground_truth": 0}, {"key": "38875041", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9403530581753624, "ground_truth": 0}, {"key": "38875041", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.818736792331367, "ground_truth": 0}, {"key": "38875041", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743776654377, "ground_truth": 0}, {"key": "38875041", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377774268325, "ground_truth": 0}]