[{"key": "35232142", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.10017222317196597, "ground_truth": 0}, {"key": "35232142", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3575675400643844, "ground_truth": 0}, {"key": "35232142", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2658804813772118, "ground_truth": 0}, {"key": "35232142", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091976758277513, "ground_truth": 0}, {"key": "35232142", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.19193277684269064, "ground_truth": 0}, {"key": "40143035", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7431680357461483, "ground_truth": 0}, {"key": "40143035", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6688802608754517, "ground_truth": 0}, {"key": "40143035", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7606506636934662, "ground_truth": 0}, {"key": "40143035", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210871055268, "ground_truth": 0}, {"key": "40143035", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797495340562, "ground_truth": 0}, {"key": "35951548", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.44167303567679306, "ground_truth": 0}, {"key": "35951548", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5312093697406762, "ground_truth": 0}, {"key": "35951548", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.36658973422545477, "ground_truth": 0}, {"key": "35951548", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2877678278106146, "ground_truth": 0}, {"key": "35951548", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3611647294934992, "ground_truth": 0}, {"key": "36266422", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6057990364076568, "ground_truth": 0}, {"key": "36266422", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7008948012325675, "ground_truth": 0}, {"key": "36266422", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5525396982978649, "ground_truth": 0}, {"key": "36266422", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548792916044, "ground_truth": 0}, {"key": "36266422", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.42441197960993465, "ground_truth": 0}, {"key": "38826984", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5331543927206761, "ground_truth": 0}, {"key": "38826984", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4397473621309395, "ground_truth": 0}, {"key": "38826984", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7025300423728204, "ground_truth": 0}, {"key": "38826984", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.684264043956119, "ground_truth": 0}, {"key": "38826984", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307678726741, "ground_truth": 0}, {"key": "34540833", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7534666590584643, "ground_truth": 0}, {"key": "34540833", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6566582708774753, "ground_truth": 0}, {"key": "34540833", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6150878506130277, "ground_truth": 0}, {"key": "34540833", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.649578653282415, "ground_truth": 0}, {"key": "34540833", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736784158383635, "ground_truth": 0}, {"key": "20836172", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8031738028214872, "ground_truth": 0}, {"key": "20836172", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8558511603807936, "ground_truth": 0}, {"key": "20836172", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7826624770550411, "ground_truth": 0}, {"key": "20836172", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526205204597, "ground_truth": 0}, {"key": "20836172", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256039614223, "ground_truth": 0}, {"key": "35932467", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5039061706290631, "ground_truth": 0}, {"key": "35932467", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6187804360638751, "ground_truth": 0}, {"key": "35932467", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.49218814505855857, "ground_truth": 0}, {"key": "35932467", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942934955416, "ground_truth": 0}, {"key": "35932467", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878355787568, "ground_truth": 0}, {"key": "40758845", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8529354697477803, "ground_truth": 0}, {"key": "40758845", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6943026629790343, "ground_truth": 0}, {"key": "40758845", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.823328395436136, "ground_truth": 0}, {"key": "40758845", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757645913347304, "ground_truth": 0}, {"key": "40758845", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799929075226296, "ground_truth": 0}, {"key": "30358490", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8509647066913454, "ground_truth": 0}, {"key": "30358490", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6791787006938123, "ground_truth": 0}, {"key": "30358490", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7918210777981233, "ground_truth": 0}, {"key": "30358490", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288569254888, "ground_truth": 0}, {"key": "30358490", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434897735971, "ground_truth": 0}, {"key": "34615665", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8791467661691542, "ground_truth": 0}, {"key": "34615665", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8688267674270105, "ground_truth": 0}, {"key": "34615665", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8386797710177221, "ground_truth": 0}, {"key": "34615665", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9686195707244826, "ground_truth": 0}, {"key": "34615665", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9167080766320543, "ground_truth": 0}, {"key": "35890902", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6039318428178905, "ground_truth": 0}, {"key": "35890902", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7074046822909553, "ground_truth": 0}, {"key": "35890902", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6513548676931503, "ground_truth": 0}, {"key": "35890902", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711419975843, "ground_truth": 0}, {"key": "35890902", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620700970449548, "ground_truth": 0}, {"key": "37922330", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7295197733538775, "ground_truth": 0}, {"key": "37922330", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6791787137194367, "ground_truth": 0}, {"key": "37922330", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.592666609424412, "ground_truth": 0}, {"key": "37922330", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494351205109, "ground_truth": 0}, {"key": "37922330", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905302994073068, "ground_truth": 0}, {"key": "30844962", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2146914074979939, "ground_truth": 0}, {"key": "30844962", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.413003575657433, "ground_truth": 0}, {"key": "30844962", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6169358061907741, "ground_truth": 0}, {"key": "30844962", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.22678362544653988, "ground_truth": 0}, {"key": "30844962", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.21206880613143017, "ground_truth": 0}, {"key": "36217333", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5195212935961612, "ground_truth": 0}, {"key": "36217333", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.31912138244811433, "ground_truth": 0}, {"key": "36217333", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5736783766712787, "ground_truth": 0}, {"key": "36217333", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834946192354, "ground_truth": 0}, {"key": "36217333", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883656781362, "ground_truth": 0}, {"key": "30816523", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6893056056162322, "ground_truth": 0}, {"key": "30816523", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4186969194437584, "ground_truth": 0}, {"key": "30816523", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7138307681194388, "ground_truth": 0}, {"key": "30816523", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834695173716, "ground_truth": 0}, {"key": "30816523", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632692513061, "ground_truth": 0}, {"key": "38900884", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8714748646477658, "ground_truth": 0}, {"key": "38900884", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8140528141555717, "ground_truth": 0}, {"key": "38900884", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9334308078404174, "ground_truth": 0}, {"key": "38900884", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256382017709, "ground_truth": 0}, {"key": "38900884", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511560214632, "ground_truth": 0}, {"key": "13890581", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8175744818023014, "ground_truth": 0}, {"key": "13890581", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6297746085478583, "ground_truth": 0}, {"key": "13890581", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7931059627430032, "ground_truth": 0}, {"key": "13890581", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489721956966894, "ground_truth": 0}, {"key": "13890581", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046967592936, "ground_truth": 0}, {"key": "40194700", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.862467530855967, "ground_truth": 0}, {"key": "40194700", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8998277812859965, "ground_truth": 0}, {"key": "40194700", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8278281765720528, "ground_truth": 0}, {"key": "40194700", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797132978823, "ground_truth": 0}, {"key": "40194700", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9690910394464145, "ground_truth": 0}, {"key": "37903647", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.36116473330613996, "ground_truth": 0}, {"key": "37903647", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5331544072073477, "ground_truth": 0}, {"key": "37903647", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2751297069663779, "ground_truth": 0}, {"key": "37903647", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487178763985, "ground_truth": 0}, {"key": "37903647", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519860998137046, "ground_truth": 0}, {"key": "13291223", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5409238449661923, "ground_truth": 0}, {"key": "13291223", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5253688330909317, "ground_truth": 0}, {"key": "13291223", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5214711701184375, "ground_truth": 0}, {"key": "13291223", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033869870215, "ground_truth": 0}, {"key": "13291223", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218814748621126, "ground_truth": 0}, {"key": "36052570", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3942009730505387, "ground_truth": 0}, {"key": "36052570", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6261241778089521, "ground_truth": 0}, {"key": "36052570", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6723316821378046, "ground_truth": 0}, {"key": "36052570", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.48828337972680913, "ground_truth": 0}, {"key": "36052570", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167934479926, "ground_truth": 0}, {"key": "34944735", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6150878790773349, "ground_truth": 0}, {"key": "34944735", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5736784364372028, "ground_truth": 0}, {"key": "34944735", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5755880264874067, "ground_truth": 0}, {"key": "34944735", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073814463216, "ground_truth": 0}, {"key": "34944735", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734655634403, "ground_truth": 0}, {"key": "32159602", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.23792990194308003, "ground_truth": 0}, {"key": "32159602", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5964331511099287, "ground_truth": 0}, {"key": "32159602", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4282333852462756, "ground_truth": 0}, {"key": "32159602", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.26740816114595317, "ground_truth": 0}, {"key": "32159602", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3007455895840452, "ground_truth": 0}, {"key": "34988915", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.42823339075459854, "ground_truth": 0}, {"key": "34988915", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40168778604660393, "ground_truth": 0}, {"key": "34988915", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4902356316969404, "ground_truth": 0}, {"key": "34988915", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448014204916756, "ground_truth": 0}, {"key": "34988915", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4726834850384076, "ground_truth": 0}, {"key": "37889203", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.924687694550682, "ground_truth": 0}, {"key": "37889203", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.904650535078335, "ground_truth": 0}, {"key": "37889203", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8397339587577677, "ground_truth": 0}, {"key": "37889203", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148239897887, "ground_truth": 0}, {"key": "37889203", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8976952862602127, "ground_truth": 0}, {"key": "33609927", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4590761191620807, "ground_truth": 0}, {"key": "33609927", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.579400423665084, "ground_truth": 0}, {"key": "33609927", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4073334014499838, "ground_truth": 0}, {"key": "33609927", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331318918858, "ground_truth": 0}, {"key": "33609927", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4746311800598246, "ground_truth": 0}, {"key": "33578778", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6206216430769522, "ground_truth": 0}, {"key": "33578778", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7248702599912826, "ground_truth": 0}, {"key": "33578778", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7185944054546041, "ground_truth": 0}, {"key": "33578778", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.626124152113456, "ground_truth": 0}, {"key": "33578778", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358419987181, "ground_truth": 0}, {"key": "36888270", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8080672245769518, "ground_truth": 0}, {"key": "36888270", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5755880002703316, "ground_truth": 0}, {"key": "36888270", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7446563567102892, "ground_truth": 0}, {"key": "36888270", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343838508606, "ground_truth": 0}, {"key": "36888270", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253777521638, "ground_truth": 0}, {"key": "36846007", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9511422167665227, "ground_truth": 0}, {"key": "36846007", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9755769090080744, "ground_truth": 0}, {"key": "36846007", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9420819112746647, "ground_truth": 0}, {"key": "36846007", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9362850031818433, "ground_truth": 0}, {"key": "36846007", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.950410972800305, "ground_truth": 0}, {"key": "31723471", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7505527529721175, "ground_truth": 0}, {"key": "31723471", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6460136870814067, "ground_truth": 0}, {"key": "31723471", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6774740235785153, "ground_truth": 0}, {"key": "31723471", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047013320256, "ground_truth": 0}, {"key": "31723471", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799928976210845, "ground_truth": 0}, {"key": "15921828", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3174262759318506, "ground_truth": 0}, {"key": "15921828", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.35042136790341, "ground_truth": 0}, {"key": "15921828", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2942149822289192, "ground_truth": 0}, {"key": "15921828", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262630708749, "ground_truth": 0}, {"key": "15921828", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2861692580248652, "ground_truth": 0}, {"key": "39109408", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.31237002462833885, "ground_truth": 0}, {"key": "39109408", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2861692592667364, "ground_truth": 0}, {"key": "39109408", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3363310397428239, "ground_truth": 0}, {"key": "39109408", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3611647248842632, "ground_truth": 0}, {"key": "39109408", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.30239109010362347, "ground_truth": 0}, {"key": "20936833", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.15002881415203947, "ground_truth": 0}, {"key": "20936833", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.09602549592251454, "ground_truth": 0}, {"key": "20936833", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.0933468843868593, "ground_truth": 0}, {"key": "20936833", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.08756383744266133, "ground_truth": 0}, {"key": "20936833", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.18010666229807817, "ground_truth": 0}, {"key": "36832879", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5544704720694758, "ground_truth": 0}, {"key": "36832879", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6495786174531029, "ground_truth": 0}, {"key": "36832879", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6757645961542043, "ground_truth": 0}, {"key": "36832879", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.529263378505084, "ground_truth": 0}, {"key": "36832879", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633152397583146, "ground_truth": 0}, {"key": "14958201", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.812867318458966, "ground_truth": 0}, {"key": "14958201", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7732163693874003, "ground_truth": 0}, {"key": "14958201", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8140528043729571, "ground_truth": 0}, {"key": "14958201", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438951021471206, "ground_truth": 0}, {"key": "14958201", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372107899715135, "ground_truth": 0}, {"key": "34352262", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.1470645372636678, "ground_truth": 0}, {"key": "34352262", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.24508500969845984, "ground_truth": 0}, {"key": "34352262", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2689414565846982, "ground_truth": 0}, {"key": "34352262", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.12336561091828291, "ground_truth": 0}, {"key": "34352262", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.11920292637149973, "ground_truth": 0}, {"key": "39805395", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45713670527424616, "ground_truth": 0}, {"key": "39805395", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.29583987492162894, "ground_truth": 0}, {"key": "39805395", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.30569734249728525, "ground_truth": 0}, {"key": "39805395", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4843800920334745, "ground_truth": 0}, {"key": "39805395", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.36658973193165817, "ground_truth": 0}, {"key": "34303109", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.21733751277166796, "ground_truth": 0}, {"key": "34303109", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.24220561830682066, "ground_truth": 0}, {"key": "34303109", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.30902372493332436, "ground_truth": 0}, {"key": "34303109", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3242354044412439, "ground_truth": 0}, {"key": "34303109", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2538610082913036, "ground_truth": 0}, {"key": "39939090", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9046505411835513, "ground_truth": 0}, {"key": "39939090", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8489721947152558, "ground_truth": 0}, {"key": "39939090", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9026095965531004, "ground_truth": 0}, {"key": "39939090", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.823328412319055, "ground_truth": 0}, {"key": "39939090", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920200976073, "ground_truth": 0}, {"key": "29347771", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7786493048408341, "ground_truth": 0}, {"key": "29347771", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7008948115400125, "ground_truth": 0}, {"key": "29347771", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8723473741298413, "ground_truth": 0}, {"key": "29347771", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489721915581846, "ground_truth": 0}, {"key": "29347771", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701069099337, "ground_truth": 0}, {"key": "36783415", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7839884694898104, "ground_truth": 0}, {"key": "36783415", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5736783810163938, "ground_truth": 0}, {"key": "36783415", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8044059239732744, "ground_truth": 0}, {"key": "36783415", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526366713399, "ground_truth": 0}, {"key": "36783415", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.43398146828137235, "ground_truth": 0}, {"key": "37935687", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7041601457510123, "ground_truth": 0}, {"key": "37935687", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7718434974058349, "ground_truth": 0}, {"key": "37935687", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7905303233051163, "ground_truth": 0}, {"key": "37935687", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228134933263, "ground_truth": 0}, {"key": "37935687", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511516911679, "ground_truth": 0}, {"key": "40260829", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7356416251432283, "ground_truth": 0}, {"key": "40260829", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8539127463025491, "ground_truth": 0}, {"key": "40260829", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8749346150271373, "ground_truth": 0}, {"key": "40260829", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388016189497, "ground_truth": 0}, {"key": "40260829", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215481576503, "ground_truth": 0}, {"key": "36478199", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7057850258953433, "ground_truth": 0}, {"key": "36478199", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7090191471191869, "ground_truth": 0}, {"key": "36478199", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.658417501650356, "ground_truth": 0}, {"key": "36478199", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891180477537, "ground_truth": 0}, {"key": "36478199", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786040746863, "ground_truth": 0}, {"key": "34541803", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.43782350503777606, "ground_truth": 0}, {"key": "34541803", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4320633733932857, "ground_truth": 0}, {"key": "34541803", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.43014735134953463, "ground_truth": 0}, {"key": "34541803", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704636607997, "ground_truth": 0}, {"key": "34541803", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.656658273516829, "ground_truth": 0}, {"key": "35360841", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7813306227601273, "ground_truth": 0}, {"key": "35360841", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6959583323354973, "ground_truth": 0}, {"key": "35360841", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8840392813022697, "ground_truth": 0}, {"key": "35360841", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185816275533, "ground_truth": 0}, {"key": "35360841", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867627582218, "ground_truth": 0}, {"key": "35550407", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4282333580938763, "ground_truth": 0}, {"key": "35550407", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6495786373049516, "ground_truth": 0}, {"key": "35550407", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4765796371547135, "ground_truth": 0}, {"key": "35550407", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365688825034, "ground_truth": 0}, {"key": "35550407", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819791212375, "ground_truth": 0}, {"key": "37561590", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8529354966820402, "ground_truth": 0}, {"key": "37561590", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8558511651050541, "ground_truth": 0}, {"key": "37561590", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8872046039625953, "ground_truth": 0}, {"key": "37561590", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056163337057, "ground_truth": 0}, {"key": "37561590", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303261343447, "ground_truth": 0}, {"key": "39328843", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9362849999001377, "ground_truth": 0}, {"key": "39328843", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9213576261835992, "ground_truth": 0}, {"key": "39328843", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9425067186887917, "ground_truth": 0}, {"key": "39328843", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933746274539, "ground_truth": 0}, {"key": "39328843", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9582261136643573, "ground_truth": 0}, {"key": "35389665", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9704646615162581, "ground_truth": 0}, {"key": "35389665", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9700134935898725, "ground_truth": 0}, {"key": "35389665", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9669140180599826, "ground_truth": 0}, {"key": "35389665", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9711290929544012, "ground_truth": 0}, {"key": "35389665", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9690910410300514, "ground_truth": 0}, {"key": "33080187", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.33633104952457943, "ground_truth": 0}, {"key": "33080187", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.23934933560718089, "ground_truth": 0}, {"key": "33080187", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.10594827230145522, "ground_truth": 0}, {"key": "33080187", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.15405756483052532, "ground_truth": 0}, {"key": "33080187", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982762315823106, "ground_truth": 0}, {"key": "38636995", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6261241757260857, "ground_truth": 0}, {"key": "38636995", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7371581723045583, "ground_truth": 0}, {"key": "38636995", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7386690787860599, "ground_truth": 0}, {"key": "38636995", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358475353228, "ground_truth": 0}, {"key": "38636995", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307369415635, "ground_truth": 0}, {"key": "18536236", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6654105775746287, "ground_truth": 0}, {"key": "18536236", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5679365892207722, "ground_truth": 0}, {"key": "18536236", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5389832093936172, "ground_truth": 0}, {"key": "18536236", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105474895676, "ground_truth": 0}, {"key": "18536236", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381214309407, "ground_truth": 0}, {"key": "36289151", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4941408810900663, "ground_truth": 0}, {"key": "36289151", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7025300429064624, "ground_truth": 0}, {"key": "36289151", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6688802398051362, "ground_truth": 0}, {"key": "36289151", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047217801501, "ground_truth": 0}, {"key": "36289151", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802819891768, "ground_truth": 0}, {"key": "23017045", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7233094754771379, "ground_truth": 0}, {"key": "23017045", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7606506657574054, "ground_truth": 0}, {"key": "23017045", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6548947620452578, "ground_truth": 0}, {"key": "23017045", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759753104393, "ground_truth": 0}, {"key": "23017045", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759681554683, "ground_truth": 0}, {"key": "36418082", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8019358243764564, "ground_truth": 0}, {"key": "36418082", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6909762986349234, "ground_truth": 0}, {"key": "36418082", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7008947843860135, "ground_truth": 0}, {"key": "36418082", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056322015809438, "ground_truth": 0}, {"key": "36418082", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646202968487, "ground_truth": 0}, {"key": "34396551", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4902356225798751, "ground_truth": 0}, {"key": "34396551", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5926665972457777, "ground_truth": 0}, {"key": "34396551", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6671476693192477, "ground_truth": 0}, {"key": "34396551", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4610168042956875, "ground_truth": 0}, {"key": "34396551", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796273757841, "ground_truth": 0}, {"key": "39720944", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9429286004986543, "ground_truth": 0}, {"key": "39720944", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9458012709797047, "ground_truth": 0}, {"key": "39720944", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9230391695623886, "ground_truth": 0}, {"key": "39720944", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9532750447387983, "ground_truth": 0}, {"key": "39720944", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619265902314, "ground_truth": 0}, {"key": "35884842", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.41111087509335403, "ground_truth": 0}, {"key": "35884842", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5660185502773197, "ground_truth": 0}, {"key": "35884842", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3433417245671878, "ground_truth": 0}, {"key": "35884842", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.36477754872648716, "ground_truth": 0}, {"key": "35884842", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526704115587, "ground_truth": 0}, {"key": "35403375", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.31912139449415566, "ground_truth": 0}, {"key": "35403375", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3793783684592044, "ground_truth": 0}, {"key": "35403375", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3629691993279651, "ground_truth": 0}, {"key": "35403375", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.34334172578871053, "ground_truth": 0}, {"key": "35403375", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3040416844947873, "ground_truth": 0}, {"key": "26341324", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9111797099549617, "ground_truth": 0}, {"key": "26341324", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9105454047544551, "ground_truth": 0}, {"key": "26341324", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8221891451301954, "ground_truth": 0}, {"key": "26341324", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545621191584, "ground_truth": 0}, {"key": "26341324", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819592673215, "ground_truth": 0}, {"key": "19212345", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9299510393379754, "ground_truth": 0}, {"key": "19212345", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8469578333184884, "ground_truth": 0}, {"key": "19212345", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6876300125216877, "ground_truth": 0}, {"key": "19212345", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972678057525, "ground_truth": 0}, {"key": "19212345", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970740793384, "ground_truth": 0}, {"key": "30548367", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.726425619949863, "ground_truth": 0}, {"key": "30548367", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7592254010870857, "ground_truth": 0}, {"key": "30548367", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.879146763629995, "ground_truth": 0}, {"key": "30548367", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802253027386, "ground_truth": 0}, {"key": "30548367", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825896707171, "ground_truth": 0}, {"key": "37919402", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9202179818741704, "ground_truth": 0}, {"key": "37919402", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9339146215972775, "ground_truth": 0}, {"key": "37919402", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8872045899006326, "ground_truth": 0}, {"key": "37919402", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677454461386, "ground_truth": 0}, {"key": "37919402", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9353465182555644, "ground_truth": 0}, {"key": "39995133", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9230391577402618, "ground_truth": 0}, {"key": "39995133", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9477691425105209, "ground_truth": 0}, {"key": "39995133", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9465966690911177, "ground_truth": 0}, {"key": "39995133", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9556514191660784, "ground_truth": 0}, {"key": "39995133", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149009757324, "ground_truth": 0}, {"key": "40249088", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6279512142856295, "ground_truth": 0}, {"key": "40249088", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8606036113072825, "ground_truth": 0}, {"key": "40249088", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5794003998581998, "ground_truth": 0}, {"key": "40249088", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.672331701806542, "ground_truth": 0}, {"key": "40249088", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085639306779, "ground_truth": 0}, {"key": "40254388", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5097643665457364, "ground_truth": 0}, {"key": "40254388", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6424324534907181, "ground_truth": 0}, {"key": "40254388", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.613236591465503, "ground_truth": 0}, {"key": "40254388", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494690869643, "ground_truth": 0}, {"key": "40254388", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442250910817845, "ground_truth": 0}, {"key": "31995230", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9105453954985406, "ground_truth": 0}, {"key": "31995230", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7918210754425601, "ground_truth": 0}, {"key": "31995230", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8895288513820754, "ground_truth": 0}, {"key": "31995230", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9477691410973219, "ground_truth": 0}, {"key": "31995230", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9445872102654879, "ground_truth": 0}, {"key": "38632129", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8895288424350336, "ground_truth": 0}, {"key": "38632129", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8895288476578606, "ground_truth": 0}, {"key": "38632129", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9385759651625394, "ground_truth": 0}, {"key": "38632129", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9329437164345452, "ground_truth": 0}, {"key": "38632129", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942055160097, "ground_truth": 0}, {"key": "35720795", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.721743219563112, "ground_truth": 0}, {"key": "35720795", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7905303195956112, "ground_truth": 0}, {"key": "35720795", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7295197902647594, "ground_truth": 0}, {"key": "35720795", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278799059417, "ground_truth": 0}, {"key": "35720795", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435018525377, "ground_truth": 0}, {"key": "23906759", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8548846308776191, "ground_truth": 0}, {"key": "23906759", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7931059520018507, "ground_truth": 0}, {"key": "23906759", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8459424446785732, "ground_truth": 0}, {"key": "23906759", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9289263297631389, "ground_truth": 0}, {"key": "23906759", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8933094081328417, "ground_truth": 0}, {"key": "19410108", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7233094624237496, "ground_truth": 0}, {"key": "19410108", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9026096066035475, "ground_truth": 0}, {"key": "19410108", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7549149780103667, "ground_truth": 0}, {"key": "19410108", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689520754725, "ground_truth": 0}, {"key": "19410108", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581518123549, "ground_truth": 0}, {"key": "30745137", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.370225377762172, "ground_truth": 0}, {"key": "30745137", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.31573598121202257, "ground_truth": 0}, {"key": "30745137", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5926666254646266, "ground_truth": 0}, {"key": "30745137", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3812195375892906, "ground_truth": 0}, {"key": "30745137", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708696431099, "ground_truth": 0}, {"key": "26553115", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.24077459824901068, "ground_truth": 0}, {"key": "26553115", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.24653334270772484, "ground_truth": 0}, {"key": "26553115", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.519521328146982, "ground_truth": 0}, {"key": "26553115", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632160002389263, "ground_truth": 0}, {"key": "26553115", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3040416791376345, "ground_truth": 0}, {"key": "37872311", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8879840521826853, "ground_truth": 0}, {"key": "37872311", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7431680228529494, "ground_truth": 0}, {"key": "37872311", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8757869871609729, "ground_truth": 0}, {"key": "37872311", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.925768631581579, "ground_truth": 0}, {"key": "37872311", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772228265767, "ground_truth": 0}, {"key": "35553131", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8962513764176469, "ground_truth": 0}, {"key": "35553131", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8749346223419232, "ground_truth": 0}, {"key": "35553131", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7969253805139678, "ground_truth": 0}, {"key": "35553131", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.84997117326977, "ground_truth": 0}, {"key": "35553131", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467774799016, "ground_truth": 0}, {"key": "39038936", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5175708598472114, "ground_truth": 0}, {"key": "39038936", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7786493193596385, "ground_truth": 0}, {"key": "39038936", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6095241593369625, "ground_truth": 0}, {"key": "39038936", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512503997088, "ground_truth": 0}, {"key": "39038936", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269954679264, "ground_truth": 0}, {"key": "38735486", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9788748084726172, "ground_truth": 0}, {"key": "38735486", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9888419691096437, "ground_truth": 0}, {"key": "38735486", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9750122040870133, "ground_truth": 0}, {"key": "38735486", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9876638989301698, "ground_truth": 0}, {"key": "38735486", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9740426420730645, "ground_truth": 0}, {"key": "17087845", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.47073660793686956, "ground_truth": 0}, {"key": "17087845", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.43206338239006453, "ground_truth": 0}, {"key": "17087845", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6370307801923493, "ground_truth": 0}, {"key": "17087845", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213023379406, "ground_truth": 0}, {"key": "17087845", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3738758291425726, "ground_truth": 0}, {"key": "37443011", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7371581606528034, "ground_truth": 0}, {"key": "37443011", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9118099639204965, "ground_truth": 0}, {"key": "37443011", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6757646146111371, "ground_truth": 0}, {"key": "37443011", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215364095828, "ground_truth": 0}, {"key": "37443011", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461390156000557, "ground_truth": 0}, {"key": "36855749", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8606036317202802, "ground_truth": 0}, {"key": "36855749", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8933094080963174, "ground_truth": 0}, {"key": "36855749", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8255897220438588, "ground_truth": 0}, {"key": "36855749", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897287329907, "ground_truth": 0}, {"key": "36855749", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438951052843774, "ground_truth": 0}, {"key": "35613141", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8198933231151354, "ground_truth": 0}, {"key": "35613141", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7853085856208566, "ground_truth": 0}, {"key": "35613141", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8661325198737131, "ground_truth": 0}, {"key": "35613141", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849641389731, "ground_truth": 0}, {"key": "35613141", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445757497806, "ground_truth": 0}, {"key": "39088847", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "39088847", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.49804688041516454, "ground_truth": 0}, {"key": "39088847", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.517570878210411, "ground_truth": 0}, {"key": "39088847", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.35398630174151474, "ground_truth": 0}, {"key": "39088847", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.28937169406194, "ground_truth": 0}, {"key": "33197277", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6039318328287065, "ground_truth": 0}, {"key": "33197277", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8300437718689928, "ground_truth": 0}, {"key": "33197277", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9161096085150177, "ground_truth": 0}, {"key": "33197277", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797746112742, "ground_truth": 0}, {"key": "33197277", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767914345392, "ground_truth": 0}, {"key": "33815489", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.36477755472237233, "ground_truth": 0}, {"key": "33815489", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4980468725989578, "ground_truth": 0}, {"key": "33815489", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4707366226634524, "ground_truth": 0}, {"key": "33815489", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3665897263255729, "ground_truth": 0}, {"key": "33815489", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668455905937855, "ground_truth": 0}, {"key": "35862754", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.872347379221723, "ground_truth": 0}, {"key": "35862754", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9324533107548274, "ground_truth": 0}, {"key": "35862754", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8164063802723052, "ground_truth": 0}, {"key": "35862754", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149066218061, "ground_truth": 0}, {"key": "35862754", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149066675337, "ground_truth": 0}, {"key": "36080615", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2877678220501446, "ground_truth": 0}, {"key": "36080615", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4359015090015756, "ground_truth": 0}, {"key": "36080615", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3960681645075967, "ground_truth": 0}, {"key": "36080615", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621765197724253, "ground_truth": 0}, {"key": "36080615", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953713740397, "ground_truth": 0}, {"key": "22822742", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8947894568605712, "ground_truth": 0}, {"key": "22822742", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8902942241525451, "ground_truth": 0}, {"key": "22822742", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9099070069423292, "ground_truth": 0}, {"key": "22822742", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587772177555, "ground_truth": 0}, {"key": "22822742", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070057901745, "ground_truth": 0}, {"key": "39747536", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8198933381202302, "ground_truth": 0}, {"key": "39747536", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7732163696705523, "ground_truth": 0}, {"key": "39747536", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.79692538045021, "ground_truth": 0}, {"key": "39747536", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933425659187, "ground_truth": 0}, {"key": "39747536", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528096298913, "ground_truth": 0}, {"key": "34218396", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7759445386193193, "ground_truth": 0}, {"key": "34218396", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7461390019094485, "ground_truth": 0}, {"key": "34218396", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8969755737122985, "ground_truth": 0}, {"key": "34218396", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631593997056, "ground_truth": 0}, {"key": "34218396", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8723473755251201, "ground_truth": 0}, {"key": "39150388", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5832033299330727, "ground_truth": 0}, {"key": "39150388", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5486734996038197, "ground_truth": 0}, {"key": "39150388", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5331544123987513, "ground_truth": 0}, {"key": "39150388", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5525397216732896, "ground_truth": 0}, {"key": "39150388", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359015190964715, "ground_truth": 0}, {"key": "28765782", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8300437891804888, "ground_truth": 0}, {"key": "28765782", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8365545572968672, "ground_truth": 0}, {"key": "28765782", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8322366506774825, "ground_truth": 0}, {"key": "28765782", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185853078698, "ground_truth": 0}, {"key": "28765782", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867685839632, "ground_truth": 0}, {"key": "35828022", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6406358383565923, "ground_truth": 0}, {"key": "35828022", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6057990684841487, "ground_truth": 0}, {"key": "35828022", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.868826780161714, "ground_truth": 0}, {"key": "35828022", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493305190246, "ground_truth": 0}, {"key": "35828022", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.81167601208165, "ground_truth": 0}, {"key": "27717735", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7371581442702079, "ground_truth": 0}, {"key": "27717735", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7279754319182011, "ground_truth": 0}, {"key": "27717735", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.509764388606138, "ground_truth": 0}, {"key": "27717735", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419745743477, "ground_truth": 0}, {"key": "27717735", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666525489315, "ground_truth": 0}, {"key": "37977826", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6095241645552231, "ground_truth": 0}, {"key": "37977826", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4863315637892972, "ground_truth": 0}, {"key": "37977826", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.41111088022342085, "ground_truth": 0}, {"key": "37977826", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802608292365, "ground_truth": 0}, {"key": "37977826", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058590904876702, "ground_truth": 0}, {"key": "31768588", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9219218390973674, "ground_truth": 0}, {"key": "31768588", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.953966099663923, "ground_truth": 0}, {"key": "31768588", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.893309407387116, "ground_truth": 0}, {"key": "31768588", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148151917142, "ground_truth": 0}, {"key": "31768588", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297800488816, "ground_truth": 0}, {"key": "37183351", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.42441197452692087, "ground_truth": 0}, {"key": "37183351", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3056973319025339, "ground_truth": 0}, {"key": "37183351", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5428633034112378, "ground_truth": 0}, {"key": "37183351", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711473614801, "ground_truth": 0}, {"key": "37183351", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.46101677373973377, "ground_truth": 0}, {"key": "39622090", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5945512360805519, "ground_truth": 0}, {"key": "39622090", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.583203343814971, "ground_truth": 0}, {"key": "39622090", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6076631578120338, "ground_truth": 0}, {"key": "39622090", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.45326183703464334, "ground_truth": 0}, {"key": "39622090", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035883033297, "ground_truth": 0}, {"key": "39272756", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6113819908891008, "ground_truth": 0}, {"key": "39272756", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6442251342264735, "ground_truth": 0}, {"key": "39272756", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4551986268981409, "ground_truth": 0}, {"key": "39272756", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504970998676, "ground_truth": 0}, {"key": "39272756", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689507209431, "ground_truth": 0}, {"key": "32138822", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6406358490365307, "ground_truth": 0}, {"key": "32138822", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6893056193159762, "ground_truth": 0}, {"key": "32138822", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5350984591421202, "ground_truth": 0}, {"key": "32138822", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122918026395, "ground_truth": 0}, {"key": "32138822", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933371903726, "ground_truth": 0}, {"key": "31070114", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.21601153458029507, "ground_truth": 0}, {"key": "31070114", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.22541661131475874, "ground_truth": 0}, {"key": "31070114", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.21601153945623686, "ground_truth": 0}, {"key": "31070114", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594720751523983, "ground_truth": 0}, {"key": "31070114", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.28140560880670623, "ground_truth": 0}, {"key": "39652762", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8816149080506731, "ground_truth": 0}, {"key": "39652762", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.856812286610704, "ground_truth": 0}, {"key": "39652762", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8783142432174996, "ground_truth": 0}, {"key": "39652762", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898672826823, "ground_truth": 0}, {"key": "39652762", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.724870258844189, "ground_truth": 0}, {"key": "33258866", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.548673484801558, "ground_truth": 0}, {"key": "33258866", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6959583309497843, "ground_truth": 0}, {"key": "33258866", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5389832165614815, "ground_truth": 0}, {"key": "33258866", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381537304994, "ground_truth": 0}, {"key": "33258866", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011544015301, "ground_truth": 0}, {"key": "36962388", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7662936405479033, "ground_truth": 0}, {"key": "36962388", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.46879062110352554, "ground_truth": 0}, {"key": "36962388", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7154240143562823, "ground_truth": 0}, {"key": "36962388", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106283088196833, "ground_truth": 0}, {"key": "36962388", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283173055445, "ground_truth": 0}, {"key": "32282272", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.18952107664108406, "ground_truth": 0}, {"key": "32282272", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.22405544722342602, "ground_truth": 0}, {"key": "32282272", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.35398631639130285, "ground_truth": 0}, {"key": "32282272", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.16667539112774415, "ground_truth": 0}, {"key": "32282272", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.27669051872716566, "ground_truth": 0}, {"key": "36093072", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9124361671314077, "ground_truth": 0}, {"key": "36093072", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9161096191943602, "ground_truth": 0}, {"key": "36093072", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.907312218167489, "ground_truth": 0}, {"key": "36093072", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.955319131234339, "ground_truth": 0}, {"key": "36093072", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.939913355561275, "ground_truth": 0}, {"key": "38879972", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6242935473643291, "ground_truth": 0}, {"key": "38879972", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7154239778711705, "ground_truth": 0}, {"key": "38879972", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6132365626360254, "ground_truth": 0}, {"key": "38879972", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998610964021, "ground_truth": 0}, {"key": "38879972", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381737805622, "ground_truth": 0}, {"key": "32106473", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.567936629089363, "ground_truth": 0}, {"key": "32106473", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6442251157039355, "ground_truth": 0}, {"key": "32106473", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.611381975094644, "ground_truth": 0}, {"key": "32106473", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545767769681, "ground_truth": 0}, {"key": "32106473", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195153693175, "ground_truth": 0}, {"key": "40415815", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5926666071175467, "ground_truth": 0}, {"key": "40415815", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6495786220558926, "ground_truth": 0}, {"key": "40415815", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5156199318004189, "ground_truth": 0}, {"key": "40415815", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269865327761, "ground_truth": 0}, {"key": "40415815", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297745998559138, "ground_truth": 0}, {"key": "34581918", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.56025266963503, "ground_truth": 0}, {"key": "34581918", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6224593537018015, "ground_truth": 0}, {"key": "34581918", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5234203560687677, "ground_truth": 0}, {"key": "34581918", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563486488802, "ground_truth": 0}, {"key": "34581918", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918110761517, "ground_truth": 0}, {"key": "33004157", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8947894569965752, "ground_truth": 0}, {"key": "33004157", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7892337161458679, "ground_truth": 0}, {"key": "33004157", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8816149150110018, "ground_truth": 0}, {"key": "33004157", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9066531190248334, "ground_truth": 0}, {"key": "33004157", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366544296225, "ground_truth": 0}, {"key": "30334943", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.860603623857085, "ground_truth": 0}, {"key": "30334943", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8816149005368793, "ground_truth": 0}, {"key": "30334943", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8824278555774097, "ground_truth": 0}, {"key": "30334943", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215265092584, "ground_truth": 0}, {"key": "30334943", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956580822858016, "ground_truth": 0}, {"key": "33280503", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.420599600904049, "ground_truth": 0}, {"key": "33280503", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.42441198617946047, "ground_truth": 0}, {"key": "33280503", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2146914096983748, "ground_truth": 0}, {"key": "33280503", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4092207973495019, "ground_truth": 0}, {"key": "33280503", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237143403963, "ground_truth": 0}, {"key": "25726782", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8749346206417409, "ground_truth": 0}, {"key": "25726782", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8418256460466241, "ground_truth": 0}, {"key": "25726782", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.931462505154818, "ground_truth": 0}, {"key": "25726782", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382254778505, "ground_truth": 0}, {"key": "25726782", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392809109963, "ground_truth": 0}, {"key": "35479854", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6859494578074392, "ground_truth": 0}, {"key": "35479854", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7106282790611834, "ground_truth": 0}, {"key": "35479854", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8233283919652586, "ground_truth": 0}, {"key": "35479854", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187368104316797, "ground_truth": 0}, {"key": "35479854", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358537681449, "ground_truth": 0}, {"key": "32716226", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6688802588298016, "ground_truth": 0}, {"key": "32716226", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6992544330602021, "ground_truth": 0}, {"key": "32716226", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5698526642265896, "ground_truth": 0}, {"key": "32716226", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476935900159, "ground_truth": 0}, {"key": "32716226", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544168029811, "ground_truth": 0}, {"key": "37047554", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6584175047794996, "ground_truth": 0}, {"key": "37047554", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2583259877561722, "ground_truth": 0}, {"key": "37047554", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.35936415242859726, "ground_truth": 0}, {"key": "37047554", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262828604598, "ground_truth": 0}, {"key": "37047554", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.37570645047558265, "ground_truth": 0}, {"key": "36565290", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.943763655107771, "ground_truth": 0}, {"key": "36565290", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8848377771561506, "ground_truth": 0}, {"key": "36565290", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8969755699333358, "ground_truth": 0}, {"key": "36565290", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8925625256764926, "ground_truth": 0}, {"key": "36565290", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9381240146849331, "ground_truth": 0}, {"key": "27758640", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6876299797457079, "ground_truth": 0}, {"key": "27758640", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6187804629741289, "ground_truth": 0}, {"key": "27758640", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7592254048009304, "ground_truth": 0}, {"key": "27758640", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434893647684, "ground_truth": 0}, {"key": "27758640", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149759643918, "ground_truth": 0}, {"key": "28897118", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5350984270788814, "ground_truth": 0}, {"key": "28897118", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3311197328350672, "ground_truth": 0}, {"key": "28897118", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.39420094310812825, "ground_truth": 0}, {"key": "28897118", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011775921008, "ground_truth": 0}, {"key": "28897118", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199347212351, "ground_truth": 0}, {"key": "38452661", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9651191160163817, "ground_truth": 0}, {"key": "38452661", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9184802442551675, "ground_truth": 0}, {"key": "38452661", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8661325275349411, "ground_truth": 0}, {"key": "38452661", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846212916292, "ground_truth": 0}, {"key": "38452661", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737301731765, "ground_truth": 0}, {"key": "38033492", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7563575637596883, "ground_truth": 0}, {"key": "38033492", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4960938085805121, "ground_truth": 0}, {"key": "38033492", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7185943904433971, "ground_truth": 0}, {"key": "38033492", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998538262843, "ground_truth": 0}, {"key": "38033492", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.832236666244993, "ground_truth": 0}, {"key": "35949555", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8596637514510783, "ground_truth": 0}, {"key": "35949555", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8947894591140059, "ground_truth": 0}, {"key": "35949555", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9385759596475874, "ground_truth": 0}, {"key": "35949555", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.887984047825862, "ground_truth": 0}, {"key": "35949555", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096123705478, "ground_truth": 0}, {"key": "15263826", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7446563482984054, "ground_truth": 0}, {"key": "15263826", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5467381651653279, "ground_truth": 0}, {"key": "15263826", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7386690683846833, "ground_truth": 0}, {"key": "15263826", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754529778633, "ground_truth": 0}, {"key": "15263826", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239794948843, "ground_truth": 0}, {"key": "37313866", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9066531277857123, "ground_truth": 0}, {"key": "37313866", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5621765180145257, "ground_truth": 0}, {"key": "37313866", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6842640361749447, "ground_truth": 0}, {"key": "37313866", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159293652915, "ground_truth": 0}, {"key": "37313866", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476547823503, "ground_truth": 0}, {"key": "13911157", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8925625174838588, "ground_truth": 0}, {"key": "13911157", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9539661012661057, "ground_truth": 0}, {"key": "13911157", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9367494812477208, "ground_truth": 0}, {"key": "13911157", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9268352779200593, "ground_truth": 0}, {"key": "13911157", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9299510454167614, "ground_truth": 0}, {"key": "39594894", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7264255923154816, "ground_truth": 0}, {"key": "39594894", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6909763050451027, "ground_truth": 0}, {"key": "39594894", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4397473649778466, "ground_truth": 0}, {"key": "39594894", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106282888703146, "ground_truth": 0}, {"key": "39594894", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.594551268045161, "ground_truth": 0}, {"key": "34096170", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.68426402250978, "ground_truth": 0}, {"key": "34096170", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8418256465765938, "ground_truth": 0}, {"key": "34096170", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8887587933892661, "ground_truth": 0}, {"key": "34096170", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358527914106, "ground_truth": 0}, {"key": "34096170", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059156387451, "ground_truth": 0}, {"key": "37891952", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9793540710089057, "ground_truth": 0}, {"key": "37891952", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9722043779681736, "ground_truth": 0}, {"key": "37891952", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9821512607233394, "ground_truth": 0}, {"key": "37891952", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9928231172240294, "ground_truth": 0}, {"key": "37891952", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9683812297534363, "ground_truth": 0}, {"key": "40186158", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5926665980884801, "ground_truth": 0}, {"key": "40186158", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4455295240213868, "ground_truth": 0}, {"key": "40186158", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7279754289670922, "ground_truth": 0}, {"key": "40186158", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3923368150855556, "ground_truth": 0}, {"key": "40186158", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.49414089537205014, "ground_truth": 0}, {"key": "37049719", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7008948229622283, "ground_truth": 0}, {"key": "37049719", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7461390004557426, "ground_truth": 0}, {"key": "37049719", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6959583015497731, "ground_truth": 0}, {"key": "37049719", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737407560714, "ground_truth": 0}, {"key": "37049719", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.721743197162538, "ground_truth": 0}, {"key": "34610504", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9079671364249824, "ground_truth": 0}, {"key": "34610504", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8807970866193728, "ground_truth": 0}, {"key": "34610504", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8774767855724616, "ground_truth": 0}, {"key": "34610504", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545663224015, "ground_truth": 0}, {"key": "34610504", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972662645611, "ground_truth": 0}, {"key": "37595429", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7813306424474281, "ground_truth": 0}, {"key": "37595429", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.668880282696557, "ground_truth": 0}, {"key": "37595429", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8128673210999136, "ground_truth": 0}, {"key": "37595429", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367979917723, "ground_truth": 0}, {"key": "37595429", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307595462082, "ground_truth": 0}, {"key": "29772670", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.20307463013994628, "ground_truth": 0}, {"key": "29772670", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5832033443697787, "ground_truth": 0}, {"key": "29772670", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.32594952255055754, "ground_truth": 0}, {"key": "29772670", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689614330701, "ground_truth": 0}, {"key": "29772670", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.37937837876916847, "ground_truth": 0}, {"key": "36369872", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7248703007885688, "ground_truth": 0}, {"key": "36369872", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4092207953328563, "ground_truth": 0}, {"key": "36369872", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7931059470781959, "ground_truth": 0}, {"key": "36369872", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047234066864, "ground_truth": 0}, {"key": "36369872", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281442009008, "ground_truth": 0}, {"key": "34527433", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.48242911753220363, "ground_truth": 0}, {"key": "34527433", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.32594950871524486, "ground_truth": 0}, {"key": "34527433", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.523420378326084, "ground_truth": 0}, {"key": "34527433", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.51171663018241, "ground_truth": 0}, {"key": "34527433", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.31405051427984754, "ground_truth": 0}, {"key": "31111734", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8479677621314424, "ground_truth": 0}, {"key": "31111734", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7233094727913382, "ground_truth": 0}, {"key": "31111734", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8344068873999964, "ground_truth": 0}, {"key": "31111734", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998781515738, "ground_truth": 0}, {"key": "31111734", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637442201338, "ground_truth": 0}, {"key": "40303872", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5583269595812127, "ground_truth": 0}, {"key": "40303872", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7563575754625045, "ground_truth": 0}, {"key": "40303872", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7704647667258494, "ground_truth": 0}, {"key": "40303872", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948206491558, "ground_truth": 0}, {"key": "40303872", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575649644853, "ground_truth": 0}, {"key": "33653553", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5195213264638348, "ground_truth": 0}, {"key": "33653553", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5983121895912431, "ground_truth": 0}, {"key": "33653553", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5774953918344806, "ground_truth": 0}, {"key": "33653553", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593431266039, "ground_truth": 0}, {"key": "33653553", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633965500342, "ground_truth": 0}, {"key": "34404510", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7563575348453505, "ground_truth": 0}, {"key": "34404510", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.712232178307632, "ground_truth": 0}, {"key": "34404510", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7662936359805539, "ground_truth": 0}, {"key": "34404510", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026690330982, "ground_truth": 0}, {"key": "34404510", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.665410556940209, "ground_truth": 0}, {"key": "35568692", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.34334175277854617, "ground_truth": 0}, {"key": "35568692", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.20055768576764277, "ground_truth": 0}, {"key": "35568692", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.22405545853408254, "ground_truth": 0}, {"key": "35568692", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.24364243636627553, "ground_truth": 0}, {"key": "35568692", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.17106118608123216, "ground_truth": 0}, {"key": "39151664", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4092207768316269, "ground_truth": 0}, {"key": "39151664", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5350984542056662, "ground_truth": 0}, {"key": "39151664", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2658804733921876, "ground_truth": 0}, {"key": "39151664", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.39793842381925926, "ground_truth": 0}, {"key": "39151664", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544132688162, "ground_truth": 0}, {"key": "37493670", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.993661078158785, "ground_truth": 0}, {"key": "37493670", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9960851766280401, "ground_truth": 0}, {"key": "37493670", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9964342635801703, "ground_truth": 0}, {"key": "37493670", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9957020612375684, "ground_truth": 0}, {"key": "37493670", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.994779874126059, "ground_truth": 0}, {"key": "21935983", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.33633104512682876, "ground_truth": 0}, {"key": "21935983", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.37570647426981363, "ground_truth": 0}, {"key": "21935983", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3468730763410561, "ground_truth": 0}, {"key": "21935983", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.39981166404532975, "ground_truth": 0}, {"key": "21935983", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.15304216077860688, "ground_truth": 0}, {"key": "38174214", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8198933397089476, "ground_truth": 0}, {"key": "38174214", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8633916149527596, "ground_truth": 0}, {"key": "38174214", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8418256438999983, "ground_truth": 0}, {"key": "38174214", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325226644397, "ground_truth": 0}, {"key": "38174214", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631578081325, "ground_truth": 0}, {"key": "40319923", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7295197715377235, "ground_truth": 0}, {"key": "40319923", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9425067233913835, "ground_truth": 0}, {"key": "40319923", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8688267713873542, "ground_truth": 0}, {"key": "40319923", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437807151013, "ground_truth": 0}, {"key": "40319923", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.817574491474654, "ground_truth": 0}, {"key": "36478264", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7154240064521725, "ground_truth": 0}, {"key": "36478264", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8300437782603843, "ground_truth": 0}, {"key": "36478264", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7918210885663477, "ground_truth": 0}, {"key": "36478264", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.790530315391174, "ground_truth": 0}, {"key": "36478264", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278532457678, "ground_truth": 0}, {"key": "11935769", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5679366345460722, "ground_truth": 0}, {"key": "11935769", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4824291213960511, "ground_truth": 0}, {"key": "11935769", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5370413929988737, "ground_truth": 0}, {"key": "11935769", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125718459569, "ground_truth": 0}, {"key": "11935769", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199624031493, "ground_truth": 0}, {"key": "33373410", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45713672361318886, "ground_truth": 0}, {"key": "33373410", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5640984814948262, "ground_truth": 0}, {"key": "33373410", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3830641908208276, "ground_truth": 0}, {"key": "33373410", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.25386100842368975, "ground_truth": 0}, {"key": "33373410", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.21206880398822006, "ground_truth": 0}, {"key": "11130680", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7745833962035317, "ground_truth": 0}, {"key": "11130680", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8670357655132288, "ground_truth": 0}, {"key": "11130680", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.24944723694351928, "ground_truth": 0}, {"key": "11130680", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549543030093, "ground_truth": 0}, {"key": "11130680", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056322118513171, "ground_truth": 0}, {"key": "34868650", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7295197833625969, "ground_truth": 0}, {"key": "34868650", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5448014050518003, "ground_truth": 0}, {"key": "34868650", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9066531151852643, "ground_truth": 0}, {"key": "34868650", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918276401889, "ground_truth": 0}, {"key": "34868650", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269238192071, "ground_truth": 0}, {"key": "33960561", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5869964236667174, "ground_truth": 0}, {"key": "33960561", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3363310495935763, "ground_truth": 0}, {"key": "33960561", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5195213225366958, "ground_truth": 0}, {"key": "33960561", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413679750894, "ground_truth": 0}, {"key": "33960561", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3720487696509161, "ground_truth": 0}, {"key": "22504858", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6020616022123826, "ground_truth": 0}, {"key": "22504858", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.809275983897273, "ground_truth": 0}, {"key": "22504858", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8164063656823505, "ground_truth": 0}, {"key": "22504858", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884689747239, "ground_truth": 0}, {"key": "22504858", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058590974483819, "ground_truth": 0}, {"key": "32283530", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5851011690028728, "ground_truth": 0}, {"key": "32283530", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6460136816166979, "ground_truth": 0}, {"key": "32283530", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7662936607944036, "ground_truth": 0}, {"key": "32283530", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325173995141, "ground_truth": 0}, {"key": "32283530", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.620621615274945, "ground_truth": 0}, {"key": "38377099", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9092645127882181, "ground_truth": 0}, {"key": "38377099", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8152324794428146, "ground_truth": 0}, {"key": "38377099", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8469578555420483, "ground_truth": 0}, {"key": "38377099", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.816406390334499, "ground_truth": 0}, {"key": "38377099", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338565138934, "ground_truth": 0}, {"key": "36105123", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8799743635743399, "ground_truth": 0}, {"key": "36105123", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9473810446812139, "ground_truth": 0}, {"key": "36105123", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.937210788810091, "ground_truth": 0}, {"key": "36105123", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9118099516481777, "ground_truth": 0}, {"key": "36105123", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9334308124373616, "ground_truth": 0}, {"key": "33527826", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8577681035445989, "ground_truth": 0}, {"key": "33527826", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8244619354182771, "ground_truth": 0}, {"key": "33527826", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.852935491328925, "ground_truth": 0}, {"key": "33527826", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872045875325045, "ground_truth": 0}, {"key": "33527826", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972648884356, "ground_truth": 0}, {"key": "32349891", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5486735130070095, "ground_truth": 0}, {"key": "32349891", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6169358378086734, "ground_truth": 0}, {"key": "32349891", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8044059150738874, "ground_truth": 0}, {"key": "32349891", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241538248365, "ground_truth": 0}, {"key": "32349891", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563512790378, "ground_truth": 0}, {"key": "34281974", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7994423214813422, "ground_truth": 0}, {"key": "34281974", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6113819958937707, "ground_truth": 0}, {"key": "34281974", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7839884720277251, "ground_truth": 0}, {"key": "34281974", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808785893592151, "ground_truth": 0}, {"key": "34281974", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593220844393, "ground_truth": 0}, {"key": "29387866", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.674050466537381, "ground_truth": 0}, {"key": "29387866", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5486734877541339, "ground_truth": 0}, {"key": "29387866", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7264256175759054, "ground_truth": 0}, {"key": "29387866", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3629692148122506, "ground_truth": 0}, {"key": "29387866", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.37387586273824397, "ground_truth": 0}, {"key": "35731925", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9899864293400764, "ground_truth": 0}, {"key": "35731925", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.996054593252398, "ground_truth": 0}, {"key": "35731925", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9859363727273006, "ground_truth": 0}, {"key": "35731925", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9931495204780139, "ground_truth": 0}, {"key": "35731925", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9962345861424711, "ground_truth": 0}, {"key": "38829733", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8976953019875362, "ground_truth": 0}, {"key": "38829733", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7008948049282883, "ground_truth": 0}, {"key": "38829733", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8757870082654957, "ground_truth": 0}, {"key": "38829733", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509647137753449, "ground_truth": 0}, {"key": "38829733", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601398430835, "ground_truth": 0}, {"key": "24624736", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9019206740277866, "ground_truth": 0}, {"key": "24624736", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8976953107306943, "ground_truth": 0}, {"key": "24624736", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8832359938954708, "ground_truth": 0}, {"key": "24624736", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681030629913, "ground_truth": 0}, {"key": "24624736", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767776013951, "ground_truth": 0}, {"key": "36928562", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9807288630560599, "ground_truth": 0}, {"key": "36928562", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9529258214012019, "ground_truth": 0}, {"key": "36928562", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9711290918197429, "ground_truth": 0}, {"key": "36928562", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.983970853125975, "ground_truth": 0}, {"key": "36928562", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.977542946348604, "ground_truth": 0}, {"key": "34941119", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3702254123225903, "ground_truth": 0}, {"key": "34941119", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.44167298996186866, "ground_truth": 0}, {"key": "34941119", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4263216117421349, "ground_truth": 0}, {"key": "34941119", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.586996413857301, "ground_truth": 0}, {"key": "34941119", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4263215971026848, "ground_truth": 0}, {"key": "30206231", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5156199300278909, "ground_truth": 0}, {"key": "30206231", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4804786668888554, "ground_truth": 0}, {"key": "30206231", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3328523422127972, "ground_truth": 0}, {"key": "30206231", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136895732139, "ground_truth": 0}, {"key": "30206231", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633153082166725, "ground_truth": 0}, {"key": "35584972", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4130035821691108, "ground_truth": 0}, {"key": "35584972", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6654105751994132, "ground_truth": 0}, {"key": "35584972", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5292634034966021, "ground_truth": 0}, {"key": "35584972", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2173375413333517, "ground_truth": 0}, {"key": "35584972", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544343400009, "ground_truth": 0}, {"key": "39277709", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.887984051077604, "ground_truth": 0}, {"key": "39277709", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9529258185925426, "ground_truth": 0}, {"key": "39277709", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8766343706747012, "ground_truth": 0}, {"key": "39277709", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549623002968, "ground_truth": 0}, {"key": "39277709", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354808912678, "ground_truth": 0}, {"key": "36123657", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8152325038152658, "ground_truth": 0}, {"key": "36123657", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.870597264947249, "ground_truth": 0}, {"key": "36123657", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8688267758976699, "ground_truth": 0}, {"key": "36123657", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.805632166845885, "ground_truth": 0}, {"key": "36123657", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757870056883856, "ground_truth": 0}, {"key": "33363938", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8006919896826111, "ground_truth": 0}, {"key": "33363938", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4111108521508858, "ground_truth": 0}, {"key": "33363938", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8080672101514028, "ground_truth": 0}, {"key": "33363938", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9167080831320269, "ground_truth": 0}, {"key": "33363938", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267118006400587, "ground_truth": 0}, {"key": "37349129", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.68257373516295, "ground_truth": 0}, {"key": "37349129", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.47073659172138743, "ground_truth": 0}, {"key": "37349129", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7248702863622042, "ground_truth": 0}, {"key": "37349129", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300702744148, "ground_truth": 0}, {"key": "37349129", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746167066799, "ground_truth": 0}, {"key": "37160199", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5717666036945105, "ground_truth": 0}, {"key": "37160199", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4687906103965036, "ground_truth": 0}, {"key": "37160199", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3328523374388765, "ground_truth": 0}, {"key": "37160199", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4532618449716675, "ground_truth": 0}, {"key": "37160199", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939261427483745, "ground_truth": 0}, {"key": "35891053", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8469578335745155, "ground_truth": 0}, {"key": "35891053", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8679338517944597, "ground_truth": 0}, {"key": "35891053", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.87831424696773, "ground_truth": 0}, {"key": "35891053", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070064194877, "ground_truth": 0}, {"key": "35891053", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354774249988, "ground_truth": 0}, {"key": "40694542", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5832033387643354, "ground_truth": 0}, {"key": "40694542", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5640984953223488, "ground_truth": 0}, {"key": "40694542", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7248702791561519, "ground_truth": 0}, {"key": "40694542", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624747507434, "ground_truth": 0}, {"key": "40694542", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020616019113783, "ground_truth": 0}, {"key": "24645770", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5907792213288238, "ground_truth": 0}, {"key": "24645770", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8428631387977628, "ground_truth": 0}, {"key": "24645770", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.800691993870672, "ground_truth": 0}, {"key": "24645770", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148208905784, "ground_truth": 0}, {"key": "24645770", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982490114089, "ground_truth": 0}, {"key": "37974587", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8895288433235369, "ground_truth": 0}, {"key": "37974587", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9536217950349225, "ground_truth": 0}, {"key": "37974587", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.88563146884699, "ground_truth": 0}, {"key": "37974587", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879311898420897, "ground_truth": 0}, {"key": "37974587", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.921921828675, "ground_truth": 0}, {"key": "40354149", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7090191450801144, "ground_truth": 0}, {"key": "40354149", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7732163607842567, "ground_truth": 0}, {"key": "40354149", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7892336865508844, "ground_truth": 0}, {"key": "40354149", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241504542113, "ground_truth": 0}, {"key": "40354149", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.67917871712495, "ground_truth": 0}, {"key": "35519470", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.39981167617435703, "ground_truth": 0}, {"key": "35519470", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.39420098473651705, "ground_truth": 0}, {"key": "35519470", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.31405053201733985, "ground_truth": 0}, {"key": "35519470", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.39047582097848876, "ground_truth": 0}, {"key": "35519470", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2877678050904112, "ground_truth": 0}, {"key": "36185624", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8679338429917792, "ground_truth": 0}, {"key": "36185624", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.798186797383319, "ground_truth": 0}, {"key": "36185624", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9149009581364013, "ground_truth": 0}, {"key": "36185624", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094651874481, "ground_truth": 0}, {"key": "36185624", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545507708361, "ground_truth": 0}, {"key": "39306113", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3904758485422809, "ground_truth": 0}, {"key": "39306113", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4054487423912505, "ground_truth": 0}, {"key": "39306113", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4397473383564115, "ground_truth": 0}, {"key": "39306113", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.39420096145984473, "ground_truth": 0}, {"key": "39306113", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922077905579163, "ground_truth": 0}, {"key": "19347718", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8006919936058403, "ground_truth": 0}, {"key": "19347718", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40733338465878094, "ground_truth": 0}, {"key": "19347718", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5486734821699258, "ground_truth": 0}, {"key": "19347718", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621764950051911, "ground_truth": 0}, {"key": "19347718", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306259648642, "ground_truth": 0}, {"key": "21870064", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5869964435976442, "ground_truth": 0}, {"key": "21870064", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.22953521867860205, "ground_truth": 0}, {"key": "21870064", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4610167744875237, "ground_truth": 0}, {"key": "21870064", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.35398629391749464, "ground_truth": 0}, {"key": "21870064", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.577495339913552, "ground_truth": 0}, {"key": "37675776", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8910549512231803, "ground_truth": 0}, {"key": "37675776", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9425067181481376, "ground_truth": 0}, {"key": "37675776", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8596637430887116, "ground_truth": 0}, {"key": "37675776", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511345427774, "ground_truth": 0}, {"key": "37675776", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9059898183760373, "ground_truth": 0}, {"key": "38107017", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6187804329727286, "ground_truth": 0}, {"key": "38107017", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7534666749932396, "ground_truth": 0}, {"key": "38107017", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8175744739955655, "ground_truth": 0}, {"key": "38107017", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740203985491, "ground_truth": 0}, {"key": "38107017", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982342933993, "ground_truth": 0}, {"key": "40046472", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4397473728875021, "ground_truth": 0}, {"key": "40046472", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.663668943509898, "ground_truth": 0}, {"key": "40046472", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6039318480298105, "ground_truth": 0}, {"key": "40046472", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5525397332458303, "ground_truth": 0}, {"key": "40046472", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594950857563804, "ground_truth": 0}, {"key": "32157820", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6224593240195635, "ground_truth": 0}, {"key": "32157820", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7620701055414864, "ground_truth": 0}, {"key": "32157820", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.590779208371155, "ground_truth": 0}, {"key": "32157820", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4960938467844061, "ground_truth": 0}, {"key": "32157820", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.529263386288172, "ground_truth": 0}, {"key": "41004037", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6406358646295336, "ground_truth": 0}, {"key": "41004037", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6039318360081762, "ground_truth": 0}, {"key": "41004037", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6406358628264902, "ground_truth": 0}, {"key": "41004037", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352663271163, "ground_truth": 0}, {"key": "41004037", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746105147808, "ground_truth": 0}, {"key": "21387993", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5621765091806864, "ground_truth": 0}, {"key": "21387993", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6442251059107544, "ground_truth": 0}, {"key": "21387993", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7563575640269253, "ground_truth": 0}, {"key": "21387993", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4455295322661608, "ground_truth": 0}, {"key": "21387993", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527660900646, "ground_truth": 0}, {"key": "34665539", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5428632868370725, "ground_truth": 0}, {"key": "34665539", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6279512040795066, "ground_truth": 0}, {"key": "34665539", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4167966627080775, "ground_truth": 0}, {"key": "34665539", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5350984122193497, "ground_truth": 0}, {"key": "34665539", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256051245136, "ground_truth": 0}, {"key": "37872111", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.562176508094481, "ground_truth": 0}, {"key": "37872111", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7813306282587733, "ground_truth": 0}, {"key": "37872111", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8489721852631363, "ground_truth": 0}, {"key": "37872111", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4186968880151558, "ground_truth": 0}, {"key": "37872111", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365943210611, "ground_truth": 0}, {"key": "36629542", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7918210711325888, "ground_truth": 0}, {"key": "36629542", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6169358421932153, "ground_truth": 0}, {"key": "36629542", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7905303170567902, "ground_truth": 0}, {"key": "36629542", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.640635842894465, "ground_truth": 0}, {"key": "36629542", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416400838555, "ground_truth": 0}, {"key": "36487527", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8386797567787069, "ground_truth": 0}, {"key": "36487527", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4824291268483717, "ground_truth": 0}, {"key": "36487527", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7994423263645885, "ground_truth": 0}, {"key": "36487527", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117944935177, "ground_truth": 0}, {"key": "36487527", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8688267658288471, "ground_truth": 0}, {"key": "37344756", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8354835313740364, "ground_truth": 0}, {"key": "37344756", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7446563347096712, "ground_truth": 0}, {"key": "37344756", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7295197633993666, "ground_truth": 0}, {"key": "37344756", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.627951204525132, "ground_truth": 0}, {"key": "37344756", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358746857712, "ground_truth": 0}, {"key": "38707722", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.47852883845998695, "ground_truth": 0}, {"key": "38707722", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.45907612328937625, "ground_truth": 0}, {"key": "38707722", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3886180182875628, "ground_truth": 0}, {"key": "38707722", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688131505581, "ground_truth": 0}, {"key": "38707722", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203801596471, "ground_truth": 0}, {"key": "37093419", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.37570645105991346, "ground_truth": 0}, {"key": "37093419", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.1233656171988478, "ground_truth": 0}, {"key": "37093419", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2643583487173015, "ground_truth": 0}, {"key": "37093419", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.37022539009130534, "ground_truth": 0}, {"key": "37093419", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3007455655398614, "ground_truth": 0}, {"key": "35547391", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5774953685633488, "ground_truth": 0}, {"key": "35547391", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.48828339536321785, "ground_truth": 0}, {"key": "35547391", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5175709022964582, "ground_truth": 0}, {"key": "35547391", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834721633797, "ground_truth": 0}, {"key": "35547391", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881386222909, "ground_truth": 0}, {"key": "37173168", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.702530057741544, "ground_truth": 0}, {"key": "37173168", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5621765206024626, "ground_truth": 0}, {"key": "37173168", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6076631844796154, "ground_truth": 0}, {"key": "37173168", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.729519786810087, "ground_truth": 0}, {"key": "37173168", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381894413683, "ground_truth": 0}, {"key": "30725298", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.888758793799458, "ground_truth": 0}, {"key": "30725298", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.76207010743267, "ground_truth": 0}, {"key": "30725298", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.861538204437324, "ground_truth": 0}, {"key": "30725298", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743817260015, "ground_truth": 0}, {"key": "30725298", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489721905824755, "ground_truth": 0}, {"key": "33830573", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9086178988827178, "ground_truth": 0}, {"key": "33830573", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7981867922472279, "ground_truth": 0}, {"key": "33830573", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.870597250318932, "ground_truth": 0}, {"key": "33830573", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9073122167886882, "ground_truth": 0}, {"key": "33830573", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307544188793, "ground_truth": 0}, {"key": "33415474", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.26894143952549077, "ground_truth": 0}, {"key": "33415474", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.20181322188560175, "ground_truth": 0}, {"key": "33415474", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.13117322640742607, "ground_truth": 0}, {"key": "33415474", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.18713268531950766, "ground_truth": 0}, {"key": "33415474", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.15817435175866462, "ground_truth": 0}, {"key": "37383994", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8519527934454193, "ground_truth": 0}, {"key": "37383994", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.966155966149071, "ground_truth": 0}, {"key": "37383994", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.892562517249479, "ground_truth": 0}, {"key": "37383994", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.960062684052718, "ground_truth": 0}, {"key": "37383994", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9529258230756612, "ground_truth": 0}, {"key": "38576819", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6688802562713896, "ground_truth": 0}, {"key": "38576819", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.596433150261037, "ground_truth": 0}, {"key": "38576819", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.529263383686545, "ground_truth": 0}, {"key": "38576819", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117918817481, "ground_truth": 0}, {"key": "38576819", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563457236578, "ground_truth": 0}, {"key": "34500226", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7170118716798101, "ground_truth": 0}, {"key": "34500226", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7943849598879567, "ground_truth": 0}, {"key": "34500226", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6020615721693688, "ground_truth": 0}, {"key": "34500226", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879312170520416, "ground_truth": 0}, {"key": "34500226", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063843282969, "ground_truth": 0}, {"key": "39856394", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.778649296459649, "ground_truth": 0}, {"key": "39856394", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5039061525508793, "ground_truth": 0}, {"key": "39856394", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6842640208202457, "ground_truth": 0}, {"key": "39856394", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.713830752519126, "ground_truth": 0}, {"key": "39856394", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737231754941, "ground_truth": 0}, {"key": "35499522", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.20181323284434366, "ground_truth": 0}, {"key": "35499522", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4493926098317071, "ground_truth": 0}, {"key": "35499522", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3073580163094027, "ground_truth": 0}, {"key": "35499522", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.18832398029163316, "ground_truth": 0}, {"key": "35499522", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.1812632140563043, "ground_truth": 0}, {"key": "30157766", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8255897086057935, "ground_truth": 0}, {"key": "30157766", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9039745153430869, "ground_truth": 0}, {"key": "30157766", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8539127513405881, "ground_truth": 0}, {"key": "30157766", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070022119875, "ground_truth": 0}, {"key": "30157766", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711732126244, "ground_truth": 0}, {"key": "40472346", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8705972631686806, "ground_truth": 0}, {"key": "40472346", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.857768108685022, "ground_truth": 0}, {"key": "40472346", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8688267781603068, "ground_truth": 0}, {"key": "40472346", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430373044219, "ground_truth": 0}, {"key": "40472346", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894570197159, "ground_truth": 0}, {"key": "35305635", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9118099521995219, "ground_truth": 0}, {"key": "35305635", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8816149077961632, "ground_truth": 0}, {"key": "35305635", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8910549546418605, "ground_truth": 0}, {"key": "35305635", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9390248220770608, "ground_truth": 0}, {"key": "35305635", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505345517537, "ground_truth": 0}, {"key": "32495926", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8140528050533845, "ground_truth": 0}, {"key": "32495926", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6859494414147125, "ground_truth": 0}, {"key": "32495926", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7264256056158049, "ground_truth": 0}, {"key": "32495926", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122322069634884, "ground_truth": 0}, {"key": "32495926", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366426807941, "ground_truth": 0}, {"key": "37353801", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6495786262087502, "ground_truth": 0}, {"key": "37353801", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5117166034502247, "ground_truth": 0}, {"key": "37353801", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5698526506849221, "ground_truth": 0}, {"key": "37353801", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881408707502, "ground_truth": 0}, {"key": "37353801", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073462036701, "ground_truth": 0}, {"key": "30159904", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7866228103868474, "ground_truth": 0}, {"key": "30159904", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8509647018837476, "ground_truth": 0}, {"key": "30159904", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7431679965867042, "ground_truth": 0}, {"key": "30159904", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.824461938197038, "ground_truth": 0}, {"key": "30159904", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702701108056, "ground_truth": 0}, {"key": "33698679", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46490158714794444, "ground_truth": 0}, {"key": "33698679", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6825737418580072, "ground_truth": 0}, {"key": "33698679", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.40922078559136005, "ground_truth": 0}, {"key": "33698679", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324805373244, "ground_truth": 0}, {"key": "33698679", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.674050481407764, "ground_truth": 0}, {"key": "40530172", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8757869919517547, "ground_truth": 0}, {"key": "40530172", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7606506390057315, "ground_truth": 0}, {"key": "40530172", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.519521334917557, "ground_truth": 0}, {"key": "40530172", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476645251964, "ground_truth": 0}, {"key": "40530172", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792235385575, "ground_truth": 0}, {"key": "40652941", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8832359814639871, "ground_truth": 0}, {"key": "40652941", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8633915973534678, "ground_truth": 0}, {"key": "40652941", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8840392778964407, "ground_truth": 0}, {"key": "40652941", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760263773548, "ground_truth": 0}, {"key": "40652941", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619418963367, "ground_truth": 0}, {"key": "40122246", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5389832306428834, "ground_truth": 0}, {"key": "40122246", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.49023558814992585, "ground_truth": 0}, {"key": "40122246", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3522017893385864, "ground_truth": 0}, {"key": "40122246", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4016877923576201, "ground_truth": 0}, {"key": "40122246", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2267836316098326, "ground_truth": 0}, {"key": "40032656", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8998277950611892, "ground_truth": 0}, {"key": "40032656", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7416740122649542, "ground_truth": 0}, {"key": "40032656", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7446563459074997, "ground_truth": 0}, {"key": "40032656", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797739889474, "ground_truth": 0}, {"key": "40032656", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675318902016, "ground_truth": 0}, {"key": "38913680", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6654105389556733, "ground_truth": 0}, {"key": "38913680", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5312093712694529, "ground_truth": 0}, {"key": "38913680", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.705785021744108, "ground_truth": 0}, {"key": "38913680", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.627951215176736, "ground_truth": 0}, {"key": "38913680", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762946720935, "ground_truth": 0}, {"key": "17608039", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6601723964306475, "ground_truth": 0}, {"key": "17608039", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.373875838270652, "ground_truth": 0}, {"key": "17608039", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2942149628202661, "ground_truth": 0}, {"key": "17608039", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.1871326826325869, "ground_truth": 0}, {"key": "17608039", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.27202455301394235, "ground_truth": 0}, {"key": "40434901", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9118099569548437, "ground_truth": 0}, {"key": "40434901", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7799929088312149, "ground_truth": 0}, {"key": "40434901", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8824278550427992, "ground_truth": 0}, {"key": "40434901", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933758243607, "ground_truth": 0}, {"key": "40434901", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9403530582134506, "ground_truth": 0}, {"key": "37680058", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.205615056066805, "ground_truth": 0}, {"key": "37680058", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.16559311375290972, "ground_truth": 0}, {"key": "37680058", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5583269692361171, "ground_truth": 0}, {"key": "37680058", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.26435836817018127, "ground_truth": 0}, {"key": "37680058", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3123700116715768, "ground_truth": 0}, {"key": "37291821", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7826624786960029, "ground_truth": 0}, {"key": "37291821", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5583270244807172, "ground_truth": 0}, {"key": "37291821", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6477982126020332, "ground_truth": 0}, {"key": "37291821", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527791824262, "ground_truth": 0}, {"key": "37291821", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.74167401695001, "ground_truth": 0}, {"key": "41002743", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6791787074133268, "ground_truth": 0}, {"key": "41002743", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8469578384531206, "ground_truth": 0}, {"key": "41002743", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5907791908223606, "ground_truth": 0}, {"key": "41002743", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163559119779, "ground_truth": 0}, {"key": "41002743", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.71383074921781, "ground_truth": 0}, {"key": "36322869", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7786493154588006, "ground_truth": 0}, {"key": "36322869", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9118099563435698, "ground_truth": 0}, {"key": "36322869", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.890294228947861, "ground_truth": 0}, {"key": "36322869", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526141102876, "ground_truth": 0}, {"key": "36322869", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343816288744, "ground_truth": 0}, {"key": "39459717", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7690802576912865, "ground_truth": 0}, {"key": "39459717", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7371581600403874, "ground_truth": 0}, {"key": "39459717", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8848377788540144, "ground_truth": 0}, {"key": "39459717", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759843554678, "ground_truth": 0}, {"key": "39459717", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.847967748818136, "ground_truth": 0}, {"key": "36503727", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5331544095369054, "ground_truth": 0}, {"key": "36503727", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5964331389394555, "ground_truth": 0}, {"key": "36503727", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.49609383565510423, "ground_truth": 0}, {"key": "36503727", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918396404281, "ground_truth": 0}, {"key": "36503727", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646186747394, "ground_truth": 0}, {"key": "35682367", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8895288385144224, "ground_truth": 0}, {"key": "35682367", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.95464741595797, "ground_truth": 0}, {"key": "35682367", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5292634038091907, "ground_truth": 0}, {"key": "35682367", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631486255375, "ground_truth": 0}, {"key": "35682367", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786268712972, "ground_truth": 0}, {"key": "36472353", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.577495357148247, "ground_truth": 0}, {"key": "36472353", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.754914970683364, "ground_truth": 0}, {"key": "36472353", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5983121915877545, "ground_truth": 0}, {"key": "36472353", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358203540068, "ground_truth": 0}, {"key": "36472353", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283271655729, "ground_truth": 0}, {"key": "37651907", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6842640276039833, "ground_truth": 0}, {"key": "37651907", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5409238770556468, "ground_truth": 0}, {"key": "37651907", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5506074042007844, "ground_truth": 0}, {"key": "37651907", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615640850246, "ground_truth": 0}, {"key": "37651907", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.65665828414031, "ground_truth": 0}, {"key": "36255476", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6688802748022883, "ground_truth": 0}, {"key": "36255476", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5964331352062672, "ground_truth": 0}, {"key": "36255476", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.680878618745814, "ground_truth": 0}, {"key": "36255476", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897198429081, "ground_truth": 0}, {"key": "36255476", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435105744461, "ground_truth": 0}, {"key": "37283518", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7969253824458361, "ground_truth": 0}, {"key": "37283518", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8688267777113106, "ground_truth": 0}, {"key": "37283518", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7154239984054531, "ground_truth": 0}, {"key": "37283518", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445486737409, "ground_truth": 0}, {"key": "37283518", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324939906614, "ground_truth": 0}, {"key": "34906785", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7325918361602319, "ground_truth": 0}, {"key": "34906785", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.811676034676867, "ground_truth": 0}, {"key": "34906785", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5563995726911494, "ground_truth": 0}, {"key": "34906785", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689369727663, "ground_truth": 0}, {"key": "34906785", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893055926787788, "ground_truth": 0}, {"key": "34965328", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9005297905602192, "ground_truth": 0}, {"key": "34965328", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8428631439034373, "ground_truth": 0}, {"key": "34965328", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8697145900498512, "ground_truth": 0}, {"key": "34965328", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215433704157, "ground_truth": 0}, {"key": "34965328", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891349676304, "ground_truth": 0}, {"key": "38788440", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4167966282267397, "ground_truth": 0}, {"key": "38788440", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6442251279726524, "ground_truth": 0}, {"key": "38788440", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3775406698987632, "ground_truth": 0}, {"key": "38788440", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.44746032843170386, "ground_truth": 0}, {"key": "38788440", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2798285106104399, "ground_truth": 0}, {"key": "35046866", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9086178985755168, "ground_truth": 0}, {"key": "35046866", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9207896804278456, "ground_truth": 0}, {"key": "35046866", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8895288545879246, "ground_truth": 0}, {"key": "35046866", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8791467799393438, "ground_truth": 0}, {"key": "35046866", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9039745171371244, "ground_truth": 0}, {"key": "37629558", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3998116434891486, "ground_truth": 0}, {"key": "37629558", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.637030790190115, "ground_truth": 0}, {"key": "37629558", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4092208085187518, "ground_truth": 0}, {"key": "37629558", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4960938524667094, "ground_truth": 0}, {"key": "37629558", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "33859914", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7461389982225063, "ground_truth": 0}, {"key": "33859914", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7563575597056574, "ground_truth": 0}, {"key": "33859914", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7090191214365134, "ground_truth": 0}, {"key": "33859914", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074046767961952, "ground_truth": 0}, {"key": "33859914", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.658417468190754, "ground_truth": 0}, {"key": "39790523", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.889528841863185, "ground_truth": 0}, {"key": "39790523", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8187367940773965, "ground_truth": 0}, {"key": "39790523", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.90329421746625, "ground_truth": 0}, {"key": "39790523", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884661987693, "ground_truth": 0}, {"key": "39790523", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9026096083652972, "ground_truth": 0}, {"key": "33509656", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46101678298696885, "ground_truth": 0}, {"key": "33509656", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5273165385130001, "ground_truth": 0}, {"key": "33509656", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4282334139065494, "ground_truth": 0}, {"key": "33509656", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4301473500483472, "ground_truth": 0}, {"key": "33509656", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6315943406320143, "ground_truth": 0}, {"key": "17380923", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8587185746663114, "ground_truth": 0}, {"key": "17380923", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8596637605750511, "ground_truth": 0}, {"key": "17380923", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8068526289083487, "ground_truth": 0}, {"key": "17380923", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104511468122, "ground_truth": 0}, {"key": "17380923", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213789652123, "ground_truth": 0}, {"key": "36202526", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6315943070985823, "ground_truth": 0}, {"key": "36202526", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8606036247809495, "ground_truth": 0}, {"key": "36202526", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6688802551022917, "ground_truth": 0}, {"key": "36202526", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.734119538715309, "ground_truth": 0}, {"key": "36202526", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.816406365612669, "ground_truth": 0}, {"key": "26419232", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7431679879298915, "ground_truth": 0}, {"key": "26419232", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7732163449333991, "ground_truth": 0}, {"key": "26419232", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7662936341228578, "ground_truth": 0}, {"key": "26419232", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477981823193787, "ground_truth": 0}, {"key": "26419232", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916098515492, "ground_truth": 0}, {"key": "34232398", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6943026792160142, "ground_truth": 0}, {"key": "34232398", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.805632189350092, "ground_truth": 0}, {"key": "34232398", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7892336999667332, "ground_truth": 0}, {"key": "34232398", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637546349898, "ground_truth": 0}, {"key": "34232398", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825850717544, "ground_truth": 0}, {"key": "33586045", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7233094693991808, "ground_truth": 0}, {"key": "33586045", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.848972186335469, "ground_truth": 0}, {"key": "33586045", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7401743599809177, "ground_truth": 0}, {"key": "33586045", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306202875524, "ground_truth": 0}, {"key": "33586045", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601318040241, "ground_truth": 0}, {"key": "32281151", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5813030563372397, "ground_truth": 0}, {"key": "32281151", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5156199366615243, "ground_truth": 0}, {"key": "32281151", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.41489885292187395, "ground_truth": 0}, {"key": "32281151", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331543898608275, "ground_truth": 0}, {"key": "32281151", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743832160608, "ground_truth": 0}, {"key": "37308159", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8479677478634691, "ground_truth": 0}, {"key": "37308159", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8872045919694325, "ground_truth": 0}, {"key": "37308159", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8757869907575048, "ground_truth": 0}, {"key": "37308159", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9416541596849732, "ground_truth": 0}, {"key": "37308159", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.874934620726947, "ground_truth": 0}, {"key": "35694408", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9086179005974236, "ground_truth": 0}, {"key": "35694408", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9572778028592019, "ground_truth": 0}, {"key": "35694408", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8019358407060673, "ground_truth": 0}, {"key": "35694408", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740061793011, "ground_truth": 0}, {"key": "35694408", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.684264002852863, "ground_truth": 0}, {"key": "39781995", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.409220783031752, "ground_truth": 0}, {"key": "39781995", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5389831956563136, "ground_truth": 0}, {"key": "39781995", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5640984845485563, "ground_truth": 0}, {"key": "39781995", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4397473502998697, "ground_truth": 0}, {"key": "39781995", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531271408493, "ground_truth": 0}, {"key": "22799372", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9441768592015161, "ground_truth": 0}, {"key": "22799372", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9615338065313268, "ground_truth": 0}, {"key": "22799372", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9358173581823772, "ground_truth": 0}, {"key": "22799372", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9412234454701458, "ground_truth": 0}, {"key": "22799372", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.977542945855965, "ground_truth": 0}, {"key": "37428240", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6876299977167295, "ground_truth": 0}, {"key": "37428240", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6601723938159214, "ground_truth": 0}, {"key": "37428240", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6876300012628515, "ground_truth": 0}, {"key": "37428240", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307863773848, "ground_truth": 0}, {"key": "37428240", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191317468996, "ground_truth": 0}, {"key": "40612657", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9500414825057142, "ground_truth": 0}, {"key": "40612657", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.982557515811744, "ground_truth": 0}, {"key": "40612657", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9569571519977296, "ground_truth": 0}, {"key": "40612657", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.97046466117177, "ground_truth": 0}, {"key": "40612657", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9796676487693194, "ground_truth": 0}, {"key": "34404662", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.798186791761898, "ground_truth": 0}, {"key": "34404662", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8164063769158738, "ground_truth": 0}, {"key": "34404662", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7201715256206667, "ground_truth": 0}, {"key": "34404662", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423310989865, "ground_truth": 0}, {"key": "34404662", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743551562006, "ground_truth": 0}, {"key": "32619704", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46684557566720014, "ground_truth": 0}, {"key": "32619704", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5273165347468906, "ground_truth": 0}, {"key": "32619704", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6740504783189286, "ground_truth": 0}, {"key": "32619704", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544237540715, "ground_truth": 0}, {"key": "32619704", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592254080917098, "ground_truth": 0}, {"key": "39014883", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7620700937469658, "ground_truth": 0}, {"key": "39014883", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5175708726100271, "ground_truth": 0}, {"key": "39014883", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6132365325771644, "ground_truth": 0}, {"key": "39014883", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762902830453, "ground_truth": 0}, {"key": "39014883", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832160147855, "ground_truth": 0}, {"key": "37982812", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8428631455530939, "ground_truth": 0}, {"key": "37982812", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8568122836264257, "ground_truth": 0}, {"key": "37982812", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.90397451433285, "ground_truth": 0}, {"key": "37982812", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9522199288653891, "ground_truth": 0}, {"key": "37982812", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9394706107649564, "ground_truth": 0}, {"key": "28123476", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8643104485326192, "ground_truth": 0}, {"key": "28123476", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7931059597354937, "ground_truth": 0}, {"key": "28123476", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7662936509185796, "ground_truth": 0}, {"key": "28123476", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897437842944, "ground_truth": 0}, {"key": "28123476", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489721914855483, "ground_truth": 0}, {"key": "39078849", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6859494834632307, "ground_truth": 0}, {"key": "39078849", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6601723920590331, "ground_truth": 0}, {"key": "39078849", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7799928810958647, "ground_truth": 0}, {"key": "39078849", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026821697796, "ground_truth": 0}, {"key": "39078849", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434965836555, "ground_truth": 0}, {"key": "39414137", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9543079699946312, "ground_truth": 0}, {"key": "39414137", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9299510479772533, "ground_truth": 0}, {"key": "39414137", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9273632906561684, "ground_truth": 0}, {"key": "39414137", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9645892684904275, "ground_truth": 0}, {"key": "39414137", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9556514148044534, "ground_truth": 0}, {"key": "37371354", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6976089149137412, "ground_truth": 0}, {"key": "37371354", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7620700990968479, "ground_truth": 0}, {"key": "37371354", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6187804314441512, "ground_truth": 0}, {"key": "37371354", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531268953015749, "ground_truth": 0}, {"key": "37371354", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283043444652, "ground_truth": 0}, {"key": "29497179", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8824278719267926, "ground_truth": 0}, {"key": "29497179", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8365545472656503, "ground_truth": 0}, {"key": "29497179", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8233283840989174, "ground_truth": 0}, {"key": "29497179", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267710222193, "ground_truth": 0}, {"key": "29497179", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942250675585, "ground_truth": 0}, {"key": "35908694", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9111796999196277, "ground_truth": 0}, {"key": "35908694", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9669140210813661, "ground_truth": 0}, {"key": "35908694", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9358173560772847, "ground_truth": 0}, {"key": "35908694", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8925625147802272, "ground_truth": 0}, {"key": "35908694", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9284088029535484, "ground_truth": 0}, {"key": "37619358", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.62612419955927, "ground_truth": 0}, {"key": "37619358", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6388352689627681, "ground_truth": 0}, {"key": "37619358", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.49609383088529774, "ground_truth": 0}, {"key": "37619358", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273164990410254, "ground_truth": 0}, {"key": "37619358", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548946881588286, "ground_truth": 0}, {"key": "37293103", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6842640266799417, "ground_truth": 0}, {"key": "37293103", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7577943757134761, "ground_truth": 0}, {"key": "37293103", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8568122978661585, "ground_truth": 0}, {"key": "37293103", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823365915571, "ground_truth": 0}, {"key": "37293103", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.875786990536988, "ground_truth": 0}, {"key": "36883729", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7866228346568458, "ground_truth": 0}, {"key": "36883729", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5717666185838758, "ground_truth": 0}, {"key": "36883729", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6132365418330059, "ground_truth": 0}, {"key": "36883729", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389804755416, "ground_truth": 0}, {"key": "36883729", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.507811873663831, "ground_truth": 0}, {"key": "39209521", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7648916072333571, "ground_truth": 0}, {"key": "39209521", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6774740267115645, "ground_truth": 0}, {"key": "39209521", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7233094657555605, "ground_truth": 0}, {"key": "39209521", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701039613756, "ground_truth": 0}, {"key": "39209521", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256225780875, "ground_truth": 0}, {"key": "27792571", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8397339667440045, "ground_truth": 0}, {"key": "27792571", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.888758792864978, "ground_truth": 0}, {"key": "27792571", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6370307928089958, "ground_truth": 0}, {"key": "27792571", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933781162272, "ground_truth": 0}, {"key": "27792571", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748519431487, "ground_truth": 0}, {"key": "39755647", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7154240207987891, "ground_truth": 0}, {"key": "39755647", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8984105464504158, "ground_truth": 0}, {"key": "39755647", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7138307476670792, "ground_truth": 0}, {"key": "39755647", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228122376849, "ground_truth": 0}, {"key": "39755647", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026681948299, "ground_truth": 0}, {"key": "40800537", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.15610489080681486, "ground_truth": 0}, {"key": "40800537", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.35756752584747836, "ground_truth": 0}, {"key": "40800537", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.21076631167366147, "ground_truth": 0}, {"key": "40800537", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.18010666583843887, "ground_truth": 0}, {"key": "40800537", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.27202454209293647, "ground_truth": 0}, {"key": "14171461", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6548947323989202, "ground_truth": 0}, {"key": "14171461", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6150878588246738, "ground_truth": 0}, {"key": "14171461", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7106283104773586, "ground_truth": 0}, {"key": "14171461", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388089704447, "ground_truth": 0}, {"key": "14171461", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583303218112, "ground_truth": 0}, {"key": "36892440", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.21601153279148347, "ground_truth": 0}, {"key": "36892440", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5019531433455579, "ground_truth": 0}, {"key": "36892440", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5467381386329897, "ground_truth": 0}, {"key": "36892440", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093676959492, "ground_truth": 0}, {"key": "36892440", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881546008778, "ground_truth": 0}, {"key": "33733410", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7386690703549268, "ground_truth": 0}, {"key": "33733410", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6757646192187028, "ground_truth": 0}, {"key": "33733410", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5467381464067818, "ground_truth": 0}, {"key": "33733410", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026868011261, "ground_truth": 0}, {"key": "33733410", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199149450024, "ground_truth": 0}, {"key": "38587765", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3398276322339477, "ground_truth": 0}, {"key": "38587765", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.23792990690159269, "ground_truth": 0}, {"key": "38587765", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.30239108069674037, "ground_truth": 0}, {"key": "38587765", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.1732882030553337, "ground_truth": 0}, {"key": "38587765", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135068964735521, "ground_truth": 0}, {"key": "41065582", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.31912141223735047, "ground_truth": 0}, {"key": "41065582", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.45907610269130755, "ground_truth": 0}, {"key": "41065582", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5926665945611342, "ground_truth": 0}, {"key": "41065582", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4571367170536992, "ground_truth": 0}, {"key": "41065582", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504863278144, "ground_truth": 0}, {"key": "34713891", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2893716998197222, "ground_truth": 0}, {"key": "34713891", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5428632659216991, "ground_truth": 0}, {"key": "34713891", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5486734763213374, "ground_truth": 0}, {"key": "34713891", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.28140560459801023, "ground_truth": 0}, {"key": "34713891", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758335967414, "ground_truth": 0}, {"key": "18913023", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8705972768154687, "ground_truth": 0}, {"key": "18913023", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9489172662512737, "ground_truth": 0}, {"key": "18913023", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8918110498318056, "ground_truth": 0}, {"key": "18913023", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070098972255, "ground_truth": 0}, {"key": "18913023", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372107939184597, "ground_truth": 0}, {"key": "36884100", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3812195593428233, "ground_truth": 0}, {"key": "36884100", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3090237148670871, "ground_truth": 0}, {"key": "36884100", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.23231015099803787, "ground_truth": 0}, {"key": "36884100", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.36477754325138023, "ground_truth": 0}, {"key": "36884100", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.278256811153448, "ground_truth": 0}, {"key": "39899913", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8643104584193564, "ground_truth": 0}, {"key": "39899913", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8766343687633332, "ground_truth": 0}, {"key": "39899913", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8175744657265966, "ground_truth": 0}, {"key": "39899913", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9066531298266409, "ground_truth": 0}, {"key": "39899913", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149030356845, "ground_truth": 0}, {"key": "30725366", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.055005285246018616, "ground_truth": 0}, {"key": "30725366", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.10818895535947795, "ground_truth": 0}, {"key": "30725366", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.11201596145786419, "ground_truth": 0}, {"key": "30725366", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.02498779560026993, "ground_truth": 0}, {"key": "30725366", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.052230851511106506, "ground_truth": 0}, {"key": "26133523", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7943849715551018, "ground_truth": 0}, {"key": "26133523", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5486734832297188, "ground_truth": 0}, {"key": "26133523", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7866228094764061, "ground_truth": 0}, {"key": "26133523", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416312185567, "ground_truth": 0}, {"key": "26133523", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585893357362, "ground_truth": 0}, {"key": "29332665", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7217432071012995, "ground_truth": 0}, {"key": "29332665", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8311430575790344, "ground_truth": 0}, {"key": "29332665", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7905303190239625, "ground_truth": 0}, {"key": "29332665", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672119120513, "ground_truth": 0}, {"key": "29332665", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036284971081, "ground_truth": 0}, {"key": "37400481", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8289388135124119, "ground_truth": 0}, {"key": "37400481", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8879840536476583, "ground_truth": 0}, {"key": "37400481", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9167080802929688, "ground_truth": 0}, {"key": "37400481", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9579122712293929, "ground_truth": 0}, {"key": "37400481", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053223098061945, "ground_truth": 0}, {"key": "38787241", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6706082797712575, "ground_truth": 0}, {"key": "38787241", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5156199465310615, "ground_truth": 0}, {"key": "38787241", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6460137073638436, "ground_truth": 0}, {"key": "38787241", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.721743206343345, "ground_truth": 0}, {"key": "38787241", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117166166651771, "ground_truth": 0}, {"key": "38225963", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6495786111478977, "ground_truth": 0}, {"key": "38225963", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.732591844410292, "ground_truth": 0}, {"key": "38225963", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6893056114411408, "ground_truth": 0}, {"key": "38225963", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918200260044, "ground_truth": 0}, {"key": "38225963", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647802870528, "ground_truth": 0}, {"key": "26072034", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.09947021544887778, "ground_truth": 0}, {"key": "26072034", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.07696083581012801, "ground_truth": 0}, {"key": "26072034", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.21469141473629463, "ground_truth": 0}, {"key": "26072034", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.16026603227625116, "ground_truth": 0}, {"key": "26072034", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2043419078890629, "ground_truth": 0}, {"key": "35690810", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7620701054208884, "ground_truth": 0}, {"key": "35690810", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8198933280057927, "ground_truth": 0}, {"key": "35690810", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8376199753053075, "ground_truth": 0}, {"key": "35690810", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437450211285, "ground_truth": 0}, {"key": "35690810", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640304614863, "ground_truth": 0}, {"key": "36855665", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9746286882928422, "ground_truth": 0}, {"key": "36855665", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9891815510851806, "ground_truth": 0}, {"key": "36855665", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9742394401209045, "ground_truth": 0}, {"key": "36855665", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9518632236420603, "ground_truth": 0}, {"key": "36855665", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.921357615340188, "ground_truth": 0}, {"key": "29757662", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7279754506567806, "ground_truth": 0}, {"key": "29757662", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7648916286048573, "ground_truth": 0}, {"key": "29757662", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6825737475590707, "ground_truth": 0}, {"key": "29757662", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964094189865, "ground_truth": 0}, {"key": "29757662", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47657965527753177, "ground_truth": 0}, {"key": "19134339", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6774740134784447, "ground_truth": 0}, {"key": "19134339", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7476159379901137, "ground_truth": 0}, {"key": "19134339", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5640984707983157, "ground_truth": 0}, {"key": "19134339", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.811676004670653, "ground_truth": 0}, {"key": "19134339", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673309768792, "ground_truth": 0}, {"key": "35360732", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8187367987397022, "ground_truth": 0}, {"key": "35360732", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8333246032982263, "ground_truth": 0}, {"key": "35360732", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8044059208249399, "ground_truth": 0}, {"key": "35360732", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897214180572, "ground_truth": 0}, {"key": "35360732", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424395041938, "ground_truth": 0}, {"key": "37713629", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3557748723404174, "ground_truth": 0}, {"key": "37713629", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.46684561670252517, "ground_truth": 0}, {"key": "37713629", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4054487300818381, "ground_truth": 0}, {"key": "37713629", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3738758198153039, "ground_truth": 0}, {"key": "37713629", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754067655139056, "ground_truth": 0}, {"key": "33393394", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6297746221790536, "ground_truth": 0}, {"key": "33393394", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7446563469248089, "ground_truth": 0}, {"key": "33393394", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.75922538716686, "ground_truth": 0}, {"key": "33393394", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575754889891, "ground_truth": 0}, {"key": "33393394", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321761681819, "ground_truth": 0}, {"key": "32275837", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8267118063081119, "ground_truth": 0}, {"key": "32275837", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8714748617515292, "ground_truth": 0}, {"key": "32275837", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8955226785919156, "ground_truth": 0}, {"key": "32275837", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094743623504, "ground_truth": 0}, {"key": "32275837", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338417991763, "ground_truth": 0}, {"key": "21458094", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6261241955084882, "ground_truth": 0}, {"key": "21458094", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.39606818305609365, "ground_truth": 0}, {"key": "21458094", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6460136999390113, "ground_truth": 0}, {"key": "21458094", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581706063189, "ground_truth": 0}, {"key": "21458094", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990267677704, "ground_truth": 0}, {"key": "40975362", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8187367954834112, "ground_truth": 0}, {"key": "40975362", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8872046019520977, "ground_truth": 0}, {"key": "40975362", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8333246009647279, "ground_truth": 0}, {"key": "40975362", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338468733739, "ground_truth": 0}, {"key": "40975362", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891227476551, "ground_truth": 0}, {"key": "35234201", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7786493194392466, "ground_truth": 0}, {"key": "35234201", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8407825964467718, "ground_truth": 0}, {"key": "35234201", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6876300215208034, "ground_truth": 0}, {"key": "35234201", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159663872923, "ground_truth": 0}, {"key": "35234201", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690881614405, "ground_truth": 0}, {"key": "36037573", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8092759774328934, "ground_truth": 0}, {"key": "36037573", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7853085916564979, "ground_truth": 0}, {"key": "36037573", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7786493174547884, "ground_truth": 0}, {"key": "36037573", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392893485568, "ground_truth": 0}, {"key": "36037573", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228303694591, "ground_truth": 0}, {"key": "30861915", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9339146307670574, "ground_truth": 0}, {"key": "30861915", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8661325110987627, "ground_truth": 0}, {"key": "30861915", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9273632982585895, "ground_truth": 0}, {"key": "30861915", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9046505274994289, "ground_truth": 0}, {"key": "30861915", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9348724467277825, "ground_truth": 0}, {"key": "40173012", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.31912139592463207, "ground_truth": 0}, {"key": "40173012", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.20689403992328623, "ground_truth": 0}, {"key": "40173012", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3056973151897858, "ground_truth": 0}, {"key": "40173012", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.20307463578812895, "ground_truth": 0}, {"key": "40173012", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.17667159111519046, "ground_truth": 0}, {"key": "35100330", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4804786734545965, "ground_truth": 0}, {"key": "35100330", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5736784204256893, "ground_truth": 0}, {"key": "35100330", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.40733339565788523, "ground_truth": 0}, {"key": "35100330", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3345894533583669, "ground_truth": 0}, {"key": "35100330", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864514823350257, "ground_truth": 0}, {"key": "37220221", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9808759631205346, "ground_truth": 0}, {"key": "37220221", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.971129093073483, "ground_truth": 0}, {"key": "37220221", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9314625132420657, "ground_truth": 0}, {"key": "37220221", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489722070698353, "ground_truth": 0}, {"key": "37220221", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9299510372848164, "ground_truth": 0}, {"key": "38815218", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9492946365235044, "ground_truth": 0}, {"key": "38815218", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9334308097936814, "ground_truth": 0}, {"key": "38815218", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8558511439798068, "ground_truth": 0}, {"key": "38815218", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.928408806671649, "ground_truth": 0}, {"key": "38815218", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9575961667847577, "ground_truth": 0}, {"key": "39379109", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5717666134971153, "ground_truth": 0}, {"key": "39379109", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.42059959611694947, "ground_truth": 0}, {"key": "39379109", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.47073660461221034, "ground_truth": 0}, {"key": "39379109", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591020820019, "ground_truth": 0}, {"key": "39379109", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486735053146442, "ground_truth": 0}, {"key": "14576125", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.19436781025562908, "ground_truth": 0}, {"key": "14576125", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.23651624039833374, "ground_truth": 0}, {"key": "14576125", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.07423136646941761, "ground_truth": 0}, {"key": "14576125", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.13117322364028278, "ground_truth": 0}, {"key": "14576125", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.031858857404998636, "ground_truth": 0}, {"key": "40814250", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7620701143478544, "ground_truth": 0}, {"key": "40814250", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7295197707600822, "ground_truth": 0}, {"key": "40814250", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8019358233253695, "ground_truth": 0}, {"key": "40814250", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.598312215462446, "ground_truth": 0}, {"key": "40814250", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163558032378, "ground_truth": 0}, {"key": "36334488", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.43014734327408444, "ground_truth": 0}, {"key": "36334488", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.45519861514252974, "ground_truth": 0}, {"key": "36334488", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6206216056031706, "ground_truth": 0}, {"key": "36334488", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.49414088700810155, "ground_truth": 0}, {"key": "36334488", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864512385346136, "ground_truth": 0}, {"key": "36888322", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5869964394670303, "ground_truth": 0}, {"key": "36888322", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4397473618020683, "ground_truth": 0}, {"key": "36888322", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6959583325537786, "ground_truth": 0}, {"key": "36888322", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704719706348, "ground_truth": 0}, {"key": "36888322", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213324910795, "ground_truth": 0}, {"key": "37318916", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8568123078592699, "ground_truth": 0}, {"key": "37318916", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8925625260032156, "ground_truth": 0}, {"key": "37318916", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.896975569758235, "ground_truth": 0}, {"key": "37318916", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9376689673020665, "ground_truth": 0}, {"key": "37318916", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632849029136, "ground_truth": 0}, {"key": "39308700", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.10970577839384775, "ground_truth": 0}, {"key": "39308700", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5907792051324128, "ground_truth": 0}, {"key": "39308700", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3775406568128363, "ground_truth": 0}, {"key": "39308700", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3380770951111605, "ground_truth": 0}, {"key": "39308700", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3979384197167383, "ground_truth": 0}, {"key": "31061543", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6442250905436262, "ground_truth": 0}, {"key": "31061543", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8428631542488859, "ground_truth": 0}, {"key": "31061543", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8289388077273175, "ground_truth": 0}, {"key": "31061543", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9496693661873882, "ground_truth": 0}, {"key": "31061543", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159396151206, "ground_truth": 0}, {"key": "37380894", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9032941991769862, "ground_truth": 0}, {"key": "37380894", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8615382189312625, "ground_truth": 0}, {"key": "37380894", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8529354811457049, "ground_truth": 0}, {"key": "37380894", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578517240405, "ground_truth": 0}, {"key": "37380894", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240853889387, "ground_truth": 0}, {"key": "38410139", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.682573742516065, "ground_truth": 0}, {"key": "38410139", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6723316756055264, "ground_truth": 0}, {"key": "38410139", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7490872070754696, "ground_truth": 0}, {"key": "38410139", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228462983446, "ground_truth": 0}, {"key": "38410139", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545696388994, "ground_truth": 0}, {"key": "35953842", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6531269063543519, "ground_truth": 0}, {"key": "35953842", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8568123017899107, "ground_truth": 0}, {"key": "35953842", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7577943703906418, "ground_truth": 0}, {"key": "35953842", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646189467493, "ground_truth": 0}, {"key": "35953842", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228498560143, "ground_truth": 0}, {"key": "39815663", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3174262401411817, "ground_truth": 0}, {"key": "39815663", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.23651622911719594, "ground_truth": 0}, {"key": "39815663", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4205996149154307, "ground_truth": 0}, {"key": "39815663", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.17553808979534766, "ground_truth": 0}, {"key": "39815663", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2213506947069286, "ground_truth": 0}, {"key": "35121432", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9207896824408592, "ground_truth": 0}, {"key": "35121432", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9278877965602605, "ground_truth": 0}, {"key": "35121432", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8887587942810152, "ground_truth": 0}, {"key": "35121432", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867740709819, "ground_truth": 0}, {"key": "35121432", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825850707342, "ground_truth": 0}, {"key": "21712310", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3684056891891438, "ground_truth": 0}, {"key": "21712310", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.28457599807572276, "ground_truth": 0}, {"key": "21712310", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46490155323477206, "ground_truth": 0}, {"key": "21712310", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.305697322427895, "ground_truth": 0}, {"key": "21712310", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643937170349, "ground_truth": 0}, {"key": "37952914", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8848377670600671, "ground_truth": 0}, {"key": "37952914", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6477982128534772, "ground_truth": 0}, {"key": "37952914", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8925625122812186, "ground_truth": 0}, {"key": "37952914", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799929121608447, "ground_truth": 0}, {"key": "37952914", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233284022488342, "ground_truth": 0}, {"key": "38956779", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6076631853997251, "ground_truth": 0}, {"key": "38956779", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4186969161589415, "ground_truth": 0}, {"key": "38956779", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6039318106801921, "ground_truth": 0}, {"key": "38956779", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615950827553, "ground_truth": 0}, {"key": "38956779", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707365767313707, "ground_truth": 0}, {"key": "36101833", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5945512447491047, "ground_truth": 0}, {"key": "36101833", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.720171523553613, "ground_truth": 0}, {"key": "36101833", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6352224116564447, "ground_truth": 0}, {"key": "36101833", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125849521373, "ground_truth": 0}, {"key": "36101833", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943748038921, "ground_truth": 0}, {"key": "35544662", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7662936637046576, "ground_truth": 0}, {"key": "35544662", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5717665966891478, "ground_truth": 0}, {"key": "35544662", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.757794380221157, "ground_truth": 0}, {"key": "35544662", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142355281436, "ground_truth": 0}, {"key": "35544662", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358309144786, "ground_truth": 0}, {"key": "39759044", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5583269928034714, "ground_truth": 0}, {"key": "39759044", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4532618482002049, "ground_truth": 0}, {"key": "39759044", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7154239937600936, "ground_truth": 0}, {"key": "39759044", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734810996987, "ground_truth": 0}, {"key": "39759044", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.447460319353076, "ground_truth": 0}, {"key": "39433018", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8832359848652498, "ground_truth": 0}, {"key": "39433018", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7866228340689005, "ground_truth": 0}, {"key": "39433018", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8469578351907417, "ground_truth": 0}, {"key": "39433018", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085737852552, "ground_truth": 0}, {"key": "39433018", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441150237741, "ground_truth": 0}, {"key": "22111959", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6297745969060001, "ground_truth": 0}, {"key": "22111959", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4493926205818603, "ground_truth": 0}, {"key": "22111959", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6388352970602622, "ground_truth": 0}, {"key": "22111959", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381506651202, "ground_truth": 0}, {"key": "22111959", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883391891456, "ground_truth": 0}, {"key": "38210094", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5640984958337469, "ground_truth": 0}, {"key": "38210094", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.43014736049871516, "ground_truth": 0}, {"key": "38210094", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5755880238062929, "ground_truth": 0}, {"key": "38210094", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570646584175904, "ground_truth": 0}, {"key": "38210094", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092208224262192, "ground_truth": 0}, {"key": "37675935", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.27357438402217693, "ground_truth": 0}, {"key": "37675935", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6495786031065743, "ground_truth": 0}, {"key": "37675935", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5888891198537907, "ground_truth": 0}, {"key": "37675935", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704631738302, "ground_truth": 0}, {"key": "37675935", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47073659468624984, "ground_truth": 0}, {"key": "35732604", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2689414186086984, "ground_truth": 0}, {"key": "35732604", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.19314738016712252, "ground_truth": 0}, {"key": "35732604", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.15304215674747357, "ground_truth": 0}, {"key": "35732604", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310452054407, "ground_truth": 0}, {"key": "35732604", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953522068730542, "ground_truth": 0}, {"key": "27453212", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6893056162590045, "ground_truth": 0}, {"key": "27453212", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6113819617375601, "ground_truth": 0}, {"key": "27453212", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.818736792842015, "ground_truth": 0}, {"key": "27453212", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759806159747, "ground_truth": 0}, {"key": "27453212", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680131940772, "ground_truth": 0}, {"key": "39910047", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.386763468438226, "ground_truth": 0}, {"key": "39910047", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5175708833379722, "ground_truth": 0}, {"key": "39910047", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5640984686704843, "ground_truth": 0}, {"key": "39910047", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.449392641919965, "ground_truth": 0}, {"key": "39910047", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.39606818427763746, "ground_truth": 0}, {"key": "40054265", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5907791924762642, "ground_truth": 0}, {"key": "40054265", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5467381366370585, "ground_truth": 0}, {"key": "40054265", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4649015710938639, "ground_truth": 0}, {"key": "40054265", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583143463873, "ground_truth": 0}, {"key": "40054265", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804263446486, "ground_truth": 0}, {"key": "19984615", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5058590986510049, "ground_truth": 0}, {"key": "19984615", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.505859095363762, "ground_truth": 0}, {"key": "19984615", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.42823341927912517, "ground_truth": 0}, {"key": "19984615", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.31573599051524914, "ground_truth": 0}, {"key": "19984615", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633154030924747, "ground_truth": 0}, {"key": "16490806", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.537041360618239, "ground_truth": 0}, {"key": "16490806", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4455295161993281, "ground_truth": 0}, {"key": "16490806", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.47657964103184886, "ground_truth": 0}, {"key": "16490806", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4016878137549625, "ground_truth": 0}, {"key": "16490806", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4320633833519921, "ground_truth": 0}, {"key": "36396237", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.950410974901227, "ground_truth": 0}, {"key": "36396237", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9224823432293956, "ground_truth": 0}, {"key": "36396237", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9372107864524263, "ground_truth": 0}, {"key": "36396237", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9575961739170877, "ground_truth": 0}, {"key": "36396237", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.939024822052751, "ground_truth": 0}, {"key": "40726444", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4339814383690279, "ground_truth": 0}, {"key": "40726444", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6513548552602549, "ground_truth": 0}, {"key": "40726444", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5851011384424207, "ground_truth": 0}, {"key": "40726444", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4707366187457814, "ground_truth": 0}, {"key": "40726444", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476843783863, "ground_truth": 0}, {"key": "37314826", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3812195735904869, "ground_truth": 0}, {"key": "37314826", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3363310554577691, "ground_truth": 0}, {"key": "37314826", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5039061784782528, "ground_truth": 0}, {"key": "37314826", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.443600420652361, "ground_truth": 0}, {"key": "37314826", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3363310531991478, "ground_truth": 0}, {"key": "38506971", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5583269717133923, "ground_truth": 0}, {"key": "38506971", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.592666596916897, "ground_truth": 0}, {"key": "38506971", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4571367097841167, "ground_truth": 0}, {"key": "38506971", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297745984531502, "ground_truth": 0}, {"key": "38506971", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.310694370991176, "ground_truth": 0}, {"key": "40699312", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8407825836262763, "ground_truth": 0}, {"key": "40699312", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8910549528015493, "ground_truth": 0}, {"key": "40699312", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9073122171324556, "ground_truth": 0}, {"key": "40699312", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767969735567, "ground_truth": 0}, {"key": "40699312", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9319595788994584, "ground_truth": 0}, {"key": "34695474", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7008948275591237, "ground_truth": 0}, {"key": "34695474", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.832236649436973, "ground_truth": 0}, {"key": "34695474", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7106283008782054, "ground_truth": 0}, {"key": "34695474", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.699254413102583, "ground_truth": 0}, {"key": "34695474", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300702346046, "ground_truth": 0}, {"key": "36281498", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8529354710139084, "ground_truth": 0}, {"key": "36281498", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7008948112108941, "ground_truth": 0}, {"key": "36281498", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7310585884305257, "ground_truth": 0}, {"key": "36281498", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743633484892, "ground_truth": 0}, {"key": "36281498", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.48242909062517336, "ground_truth": 0}, {"key": "39558652", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.40356686008808546, "ground_truth": 0}, {"key": "39558652", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.43398145566538976, "ground_truth": 0}, {"key": "39558652", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6039318398465422, "ground_truth": 0}, {"key": "39558652", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583270145082067, "ground_truth": 0}, {"key": "39558652", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792106468329, "ground_truth": 0}, {"key": "37330579", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.37754066093897254, "ground_truth": 0}, {"key": "37330579", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.33285233500022, "ground_truth": 0}, {"key": "37330579", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3157359875967299, "ground_truth": 0}, {"key": "37330579", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.28457600609285794, "ground_truth": 0}, {"key": "37330579", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2583259963678765, "ground_truth": 0}, {"key": "40547658", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6671476958248497, "ground_truth": 0}, {"key": "40547658", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6992544238479472, "ground_truth": 0}, {"key": "40547658", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6224593213098462, "ground_truth": 0}, {"key": "40547658", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584174850944959, "ground_truth": 0}, {"key": "40547658", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.611381977197794, "ground_truth": 0}, {"key": "37119340", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.680878625527391, "ground_truth": 0}, {"key": "37119340", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5563995805997306, "ground_truth": 0}, {"key": "37119340", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6169358280249372, "ground_truth": 0}, {"key": "37119340", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690818433002, "ground_truth": 0}, {"key": "37119340", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688308108921, "ground_truth": 0}, {"key": "35301627", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7025300459016106, "ground_truth": 0}, {"key": "35301627", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5117165875193351, "ground_truth": 0}, {"key": "35301627", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6406358490183679, "ground_truth": 0}, {"key": "35301627", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717665874624662, "ground_truth": 0}, {"key": "35301627", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647718533993, "ground_truth": 0}, {"key": "34037168", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3757064637709056, "ground_truth": 0}, {"key": "34037168", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2925953093806968, "ground_truth": 0}, {"key": "34037168", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3073580314423703, "ground_truth": 0}, {"key": "34037168", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3208213315237832, "ground_truth": 0}, {"key": "34037168", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.336331069122392, "ground_truth": 0}, {"key": "39703862", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9246876926475365, "ground_truth": 0}, {"key": "39703862", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9575961714986749, "ground_truth": 0}, {"key": "39703862", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9136765255279542, "ground_truth": 0}, {"key": "39703862", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.929440404366189, "ground_truth": 0}, {"key": "39703862", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9284087995045757, "ground_truth": 0}, {"key": "16554814", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7786493146662112, "ground_truth": 0}, {"key": "16554814", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6076631532385638, "ground_truth": 0}, {"key": "16554814", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7520126087555772, "ground_truth": 0}, {"key": "16554814", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799928956120842, "ground_truth": 0}, {"key": "16554814", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061836457911, "ground_truth": 0}, {"key": "32983099", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.26740815072622803, "ground_truth": 0}, {"key": "32983099", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.1490352947521359, "ground_truth": 0}, {"key": "32983099", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3904758527143642, "ground_truth": 0}, {"key": "32983099", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4359015225595132, "ground_truth": 0}, {"key": "32983099", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591052224557, "ground_truth": 0}, {"key": "41072994", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3998116387941615, "ground_truth": 0}, {"key": "41072994", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6619228607649954, "ground_truth": 0}, {"key": "41072994", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2814056134682054, "ground_truth": 0}, {"key": "41072994", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632157481550054, "ground_truth": 0}, {"key": "41072994", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864512952207444, "ground_truth": 0}, {"key": "38396247", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8749346296264456, "ground_truth": 0}, {"key": "38396247", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7853085855314733, "ground_truth": 0}, {"key": "38396247", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9489172603738687, "ground_truth": 0}, {"key": "38396247", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545580502444, "ground_truth": 0}, {"key": "38396247", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9525741245153937, "ground_truth": 0}, {"key": "37507998", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7648916094391454, "ground_truth": 0}, {"key": "37507998", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6169358344959641, "ground_truth": 0}, {"key": "37507998", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8128673206530189, "ground_truth": 0}, {"key": "37507998", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673169364435, "ground_truth": 0}, {"key": "37507998", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.845942437069995, "ground_truth": 0}, {"key": "32593929", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4863315334062124, "ground_truth": 0}, {"key": "32593929", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.723309453485576, "ground_truth": 0}, {"key": "32593929", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46684561878260616, "ground_truth": 0}, {"key": "32593929", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.542863255935171, "ground_truth": 0}, {"key": "32593929", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.560252639115214, "ground_truth": 0}, {"key": "36056449", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4244119845380728, "ground_truth": 0}, {"key": "36056449", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.455198597852573, "ground_truth": 0}, {"key": "36056449", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7170118682216624, "ground_truth": 0}, {"key": "36056449", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743518139137, "ground_truth": 0}, {"key": "36056449", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033281331254, "ground_truth": 0}, {"key": "21986185", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2704802267714953, "ground_truth": 0}, {"key": "21986185", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.17441028018042734, "ground_truth": 0}, {"key": "21986185", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.19436781989366977, "ground_truth": 0}, {"key": "21986185", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.1847675039888071, "ground_truth": 0}, {"key": "21986185", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.14608724592490505, "ground_truth": 0}, {"key": "40757465", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5679366184143144, "ground_truth": 0}, {"key": "40757465", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7341195332294325, "ground_truth": 0}, {"key": "40757465", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5563995775893904, "ground_truth": 0}, {"key": "40757465", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964533535263, "ground_truth": 0}, {"key": "40757465", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566583110598591, "ground_truth": 0}, {"key": "35198313", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7122322026973635, "ground_truth": 0}, {"key": "35198313", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5794003977583886, "ground_truth": 0}, {"key": "35198313", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5019531350760096, "ground_truth": 0}, {"key": "35198313", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593159719936, "ground_truth": 0}, {"key": "35198313", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397546822112, "ground_truth": 0}, {"key": "30604618", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7549149832111894, "ground_truth": 0}, {"key": "30604618", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7057850000794379, "ground_truth": 0}, {"key": "30604618", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9079671451818313, "ground_truth": 0}, {"key": "30604618", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125917372181, "ground_truth": 0}, {"key": "30604618", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031738215674781, "ground_truth": 0}, {"key": "35779006", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6825737285586446, "ground_truth": 0}, {"key": "35779006", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6619228532828867, "ground_truth": 0}, {"key": "35779006", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.38676347814611656, "ground_truth": 0}, {"key": "35779006", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424402577286, "ground_truth": 0}, {"key": "35779006", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666009410117, "ground_truth": 0}, {"key": "33858956", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6926419715106321, "ground_truth": 0}, {"key": "33858956", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7606506628337705, "ground_truth": 0}, {"key": "33858956", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7122321954015947, "ground_truth": 0}, {"key": "33858956", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.789233685753222, "ground_truth": 0}, {"key": "33858956", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358493642975, "ground_truth": 0}, {"key": "38633880", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.32082127408755756, "ground_truth": 0}, {"key": "38633880", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.33111974082611323, "ground_truth": 0}, {"key": "38633880", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4629586427749284, "ground_truth": 0}, {"key": "38633880", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4551985887082582, "ground_truth": 0}, {"key": "38633880", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544874177640244, "ground_truth": 0}, {"key": "36654905", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9871787867649332, "ground_truth": 0}, {"key": "36654905", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9902915240597108, "ground_truth": 0}, {"key": "36654905", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9757623638721653, "ground_truth": 0}, {"key": "36654905", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9559813560074254, "ground_truth": 0}, {"key": "36654905", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9612438061208175, "ground_truth": 0}, {"key": "26547482", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "26547482", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3684056918072559, "ground_truth": 0}, {"key": "26547482", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4436004120052489, "ground_truth": 0}, {"key": "26547482", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.29421495525810926, "ground_truth": 0}, {"key": "26547482", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4532618516789965, "ground_truth": 0}, {"key": "36439068", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6992544306577246, "ground_truth": 0}, {"key": "36439068", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6740504796796934, "ground_truth": 0}, {"key": "36439068", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3830641642915117, "ground_truth": 0}, {"key": "36439068", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035574425152, "ground_truth": 0}, {"key": "36439068", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4320633822993937, "ground_truth": 0}, {"key": "30501258", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7745833740711926, "ground_truth": 0}, {"key": "30501258", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8449215342697796, "ground_truth": 0}, {"key": "30501258", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5888891364464012, "ground_truth": 0}, {"key": "30501258", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802374612156, "ground_truth": 0}, {"key": "30501258", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802733372998, "ground_truth": 0}, {"key": "37560941", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7866228311001375, "ground_truth": 0}, {"key": "37560941", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8198933417159869, "ground_truth": 0}, {"key": "37560941", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7025300408183878, "ground_truth": 0}, {"key": "37560941", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835396893149, "ground_truth": 0}, {"key": "37560941", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737922537422, "ground_truth": 0}, {"key": "36801665", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8255897216717609, "ground_truth": 0}, {"key": "36801665", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9241418253933449, "ground_truth": 0}, {"key": "36801665", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.848972208798478, "ground_truth": 0}, {"key": "36801665", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.906653120697261, "ground_truth": 0}, {"key": "36801665", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178965111057, "ground_truth": 0}, {"key": "34954610", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7008948059988245, "ground_truth": 0}, {"key": "34954610", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3328523215762764, "ground_truth": 0}, {"key": "34954610", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5292633852859642, "ground_truth": 0}, {"key": "34954610", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883618124888, "ground_truth": 0}, {"key": "34954610", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527627059275, "ground_truth": 0}, {"key": "37020510", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8438950845985544, "ground_truth": 0}, {"key": "37020510", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8068526242021702, "ground_truth": 0}, {"key": "37020510", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8740772294945636, "ground_truth": 0}, {"key": "37020510", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145767643607, "ground_truth": 0}, {"key": "37020510", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104788840795542, "ground_truth": 0}, {"key": "38064637", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.339827619664087, "ground_truth": 0}, {"key": "38064637", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2509127766318744, "ground_truth": 0}, {"key": "38064637", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2523840515319785, "ground_truth": 0}, {"key": "38064637", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074558716084276, "ground_truth": 0}, {"key": "38064637", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.1500288158723654, "ground_truth": 0}, {"key": "40886108", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9149009446259119, "ground_truth": 0}, {"key": "40886108", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9390248212377388, "ground_truth": 0}, {"key": "40886108", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9429286072910973, "ground_truth": 0}, {"key": "40886108", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9202179887756533, "ground_truth": 0}, {"key": "40886108", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9569571525662387, "ground_truth": 0}, {"key": "38554603", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6187804152231806, "ground_truth": 0}, {"key": "38554603", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8116760223208865, "ground_truth": 0}, {"key": "38554603", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.638835286749408, "ground_truth": 0}, {"key": "38554603", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990332806088, "ground_truth": 0}, {"key": "38554603", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850384838253, "ground_truth": 0}, {"key": "39115586", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45132650326646023, "ground_truth": 0}, {"key": "39115586", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6169358210797515, "ground_truth": 0}, {"key": "39115586", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5331543983360643, "ground_truth": 0}, {"key": "39115586", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926666025987081, "ground_truth": 0}, {"key": "39115586", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850174723184, "ground_truth": 0}, {"key": "38786314", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6566582630175046, "ground_truth": 0}, {"key": "38786314", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6584175150129149, "ground_truth": 0}, {"key": "38786314", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8278281468527198, "ground_truth": 0}, {"key": "38786314", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583341533807, "ground_truth": 0}, {"key": "38786314", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920102395688, "ground_truth": 0}, {"key": "38721078", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.92078967330236, "ground_truth": 0}, {"key": "38721078", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9046505367885773, "ground_truth": 0}, {"key": "38721078", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9130583404068214, "ground_truth": 0}, {"key": "38721078", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9500414777800492, "ground_truth": 0}, {"key": "38721078", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765270869935, "ground_truth": 0}, {"key": "39475467", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7563575566402776, "ground_truth": 0}, {"key": "39475467", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6584174978066993, "ground_truth": 0}, {"key": "39475467", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7690802410109955, "ground_truth": 0}, {"key": "39475467", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389996264792, "ground_truth": 0}, {"key": "39475467", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869878797658, "ground_truth": 0}, {"key": "35691234", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8187367963583421, "ground_truth": 0}, {"key": "35691234", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5117165836555508, "ground_truth": 0}, {"key": "35691234", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46295859920180954, "ground_truth": 0}, {"key": "35691234", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.596433123647979, "ground_truth": 0}, {"key": "35691234", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615964388956, "ground_truth": 0}, {"key": "36871390", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6926419761576992, "ground_truth": 0}, {"key": "36871390", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7505527459992968, "ground_truth": 0}, {"key": "36871390", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.627951218075548, "ground_truth": 0}, {"key": "36871390", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.562176500165363, "ground_truth": 0}, {"key": "36871390", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891460594095, "ground_truth": 0}, {"key": "31730844", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5583270053455016, "ground_truth": 0}, {"key": "31730844", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.35042136356255, "ground_truth": 0}, {"key": "31730844", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5813030775168809, "ground_truth": 0}, {"key": "31730844", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.472683493499149, "ground_truth": 0}, {"key": "31730844", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3849121441757403, "ground_truth": 0}, {"key": "30810940", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.49218812506671417, "ground_truth": 0}, {"key": "30810940", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.47463119149962835, "ground_truth": 0}, {"key": "30810940", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.682573727833161, "ground_truth": 0}, {"key": "30810940", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743747197147, "ground_truth": 0}, {"key": "30810940", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.525368830146685, "ground_truth": 0}, {"key": "39352003", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8661325123481906, "ground_truth": 0}, {"key": "39352003", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8558511601738398, "ground_truth": 0}, {"key": "39352003", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9155072449393554, "ground_truth": 0}, {"key": "39352003", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9507778833849964, "ground_truth": 0}, {"key": "39352003", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9314625026867625, "ground_truth": 0}, {"key": "40118123", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.47657966781575, "ground_truth": 0}, {"key": "40118123", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6057990425945013, "ground_truth": 0}, {"key": "40118123", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5486734950533836, "ground_truth": 0}, {"key": "40118123", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318502226566, "ground_truth": 0}, {"key": "40118123", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621765138300117, "ground_truth": 0}, {"key": "37114191", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5851011528706637, "ground_truth": 0}, {"key": "37114191", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4610167858691357, "ground_truth": 0}, {"key": "37114191", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6388352662396183, "ground_truth": 0}, {"key": "37114191", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316970428932, "ground_truth": 0}, {"key": "37114191", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512048192771, "ground_truth": 0}, {"key": "39268203", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8918110427078991, "ground_truth": 0}, {"key": "39268203", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7676898628773682, "ground_truth": 0}, {"key": "39268203", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8615382194298089, "ground_truth": 0}, {"key": "39268203", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.777299855306508, "ground_truth": 0}, {"key": "39268203", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324838068028, "ground_truth": 0}, {"key": "37950968", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7264256211583002, "ground_truth": 0}, {"key": "37950968", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2798285052615146, "ground_truth": 0}, {"key": "37950968", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5292633842775039, "ground_truth": 0}, {"key": "37950968", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990374413101, "ground_truth": 0}, {"key": "37950968", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632807077086, "ground_truth": 0}, {"key": "34959807", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7201715318247548, "ground_truth": 0}, {"key": "34959807", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7041601340264524, "ground_truth": 0}, {"key": "34959807", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7994423240854309, "ground_truth": 0}, {"key": "34959807", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702744536246, "ground_truth": 0}, {"key": "34959807", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476863794206, "ground_truth": 0}, {"key": "35631314", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9309620723897444, "ground_truth": 0}, {"key": "35631314", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8998277824769743, "ground_truth": 0}, {"key": "35631314", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9473810498532317, "ground_truth": 0}, {"key": "35631314", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681117120384, "ground_truth": 0}, {"key": "35631314", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.961533807743559, "ground_truth": 0}, {"key": "38082365", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8322366463780274, "ground_truth": 0}, {"key": "38082365", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9190632948927207, "ground_truth": 0}, {"key": "38082365", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8529354790911324, "ground_truth": 0}, {"key": "38082365", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110457919867, "ground_truth": 0}, {"key": "38082365", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9149009503747236, "ground_truth": 0}, {"key": "37242829", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7154240305686959, "ground_truth": 0}, {"key": "37242829", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.437823481231076, "ground_truth": 0}, {"key": "37242829", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3702253665482251, "ground_truth": 0}, {"key": "37242829", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358417407005, "ground_truth": 0}, {"key": "37242829", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.31069434959187503, "ground_truth": 0}, {"key": "38556068", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.31237001880157395, "ground_truth": 0}, {"key": "38556068", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6406358742813071, "ground_truth": 0}, {"key": "38556068", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5467381317939924, "ground_truth": 0}, {"key": "38556068", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185305315026, "ground_truth": 0}, {"key": "38556068", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804786756672733, "ground_truth": 0}, {"key": "32969336", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7943849586049634, "ground_truth": 0}, {"key": "32969336", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8615382139218984, "ground_truth": 0}, {"key": "32969336", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7386690423072382, "ground_truth": 0}, {"key": "32969336", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948013787064, "ground_truth": 0}, {"key": "32969336", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094795938617, "ground_truth": 0}, {"key": "36825153", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.24508502356721065, "ground_truth": 0}, {"key": "36825153", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.44939263027625964, "ground_truth": 0}, {"key": "36825153", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3140505359108684, "ground_truth": 0}, {"key": "36825153", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.19436782434306885, "ground_truth": 0}, {"key": "36825153", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.38491214643368726, "ground_truth": 0}, {"key": "41050146", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9299510360510957, "ground_truth": 0}, {"key": "41050146", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8661325104959179, "ground_truth": 0}, {"key": "41050146", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8587185749140976, "ground_truth": 0}, {"key": "41050146", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8940517133828768, "ground_truth": 0}, {"key": "41050146", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204038618521, "ground_truth": 0}, {"key": "27865037", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6654105336601117, "ground_truth": 0}, {"key": "27865037", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.41489885803954546, "ground_truth": 0}, {"key": "27865037", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.38121959816504863, "ground_truth": 0}, {"key": "27865037", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.592666597704678, "ground_truth": 0}, {"key": "27865037", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935426104564, "ground_truth": 0}, {"key": "39868565", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6909762786100643, "ground_truth": 0}, {"key": "39868565", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7386690669234975, "ground_truth": 0}, {"key": "39868565", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7201714854574596, "ground_truth": 0}, {"key": "39868565", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445480530732, "ground_truth": 0}, {"key": "39868565", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.796925380615996, "ground_truth": 0}, {"key": "37761968", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6206216059457808, "ground_truth": 0}, {"key": "37761968", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7386690843895973, "ground_truth": 0}, {"key": "37761968", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7648916232894547, "ground_truth": 0}, {"key": "37761968", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943682167377, "ground_truth": 0}, {"key": "37761968", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195100438679, "ground_truth": 0}, {"key": "16326139", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.22270013647506257, "ground_truth": 0}, {"key": "16326139", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.44360044375703345, "ground_truth": 0}, {"key": "16326139", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.23651623682972625, "ground_truth": 0}, {"key": "16326139", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.399811651034093, "ground_truth": 0}, {"key": "16326139", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.36840569275593404, "ground_truth": 0}, {"key": "36568381", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6791786935821879, "ground_truth": 0}, {"key": "36568381", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.581303077986965, "ground_truth": 0}, {"key": "36568381", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7853085839077507, "ground_truth": 0}, {"key": "36568381", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802493754071, "ground_truth": 0}, {"key": "36568381", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880160558817, "ground_truth": 0}, {"key": "39855613", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7994423082618368, "ground_truth": 0}, {"key": "39855613", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9005297829539712, "ground_truth": 0}, {"key": "39855613", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9412234501734197, "ground_truth": 0}, {"key": "39855613", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672258710047, "ground_truth": 0}, {"key": "39855613", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840548998126, "ground_truth": 0}, {"key": "29856302", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5983122248202851, "ground_truth": 0}, {"key": "29856302", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6774740315673348, "ground_truth": 0}, {"key": "29856302", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6757646086147199, "ground_truth": 0}, {"key": "29856302", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743614662142, "ground_truth": 0}, {"key": "29856302", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370414029437524, "ground_truth": 0}, {"key": "35641106", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7772998375288374, "ground_truth": 0}, {"key": "35641106", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7676898469966925, "ground_truth": 0}, {"key": "35641106", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8056321734249251, "ground_truth": 0}, {"key": "35641106", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026835885076, "ground_truth": 0}, {"key": "35641106", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740138104932, "ground_truth": 0}, {"key": "39474558", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5621765014036066, "ground_truth": 0}, {"key": "39474558", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5736783867076749, "ground_truth": 0}, {"key": "39474558", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.32939169652148637, "ground_truth": 0}, {"key": "39474558", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723853442721, "ground_truth": 0}, {"key": "39474558", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300580113467, "ground_truth": 0}, {"key": "34338135", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8587185699822381, "ground_truth": 0}, {"key": "34338135", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8791467713408634, "ground_truth": 0}, {"key": "34338135", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7248702718770276, "ground_truth": 0}, {"key": "34338135", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9343951628449494, "ground_truth": 0}, {"key": "34338135", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797661609298, "ground_truth": 0}, {"key": "35870330", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7549149872215954, "ground_truth": 0}, {"key": "35870330", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8344068957874455, "ground_truth": 0}, {"key": "35870330", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7264255769044627, "ground_truth": 0}, {"key": "35870330", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338520539193, "ground_truth": 0}, {"key": "35870330", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849539311344, "ground_truth": 0}, {"key": "24478245", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8198933537320817, "ground_truth": 0}, {"key": "24478245", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8925625272230655, "ground_truth": 0}, {"key": "24478245", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7799929175693855, "ground_truth": 0}, {"key": "24478245", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110522453259, "ground_truth": 0}, {"key": "24478245", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9252299586452899, "ground_truth": 0}, {"key": "38485946", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7386691066594038, "ground_truth": 0}, {"key": "38485946", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6671476959467406, "ground_truth": 0}, {"key": "38485946", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.685949482813485, "ground_truth": 0}, {"key": "38485946", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366499681271, "ground_truth": 0}, {"key": "38485946", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689264596685, "ground_truth": 0}, {"key": "32509613", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8940517262372292, "ground_truth": 0}, {"key": "32509613", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.790530308610938, "ground_truth": 0}, {"key": "32509613", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8539127460235103, "ground_truth": 0}, {"key": "32509613", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545703516907, "ground_truth": 0}, {"key": "32509613", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053223000094702, "ground_truth": 0}, {"key": "34078819", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8479677601133586, "ground_truth": 0}, {"key": "34078819", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6584175087932652, "ground_truth": 0}, {"key": "34078819", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9241418263518827, "ground_truth": 0}, {"key": "34078819", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267773789699, "ground_truth": 0}, {"key": "34078819", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.890294228062691, "ground_truth": 0}, {"key": "39523865", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5331544035882001, "ground_truth": 0}, {"key": "39523865", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7676898639406887, "ground_truth": 0}, {"key": "39523865", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7490872075689533, "ground_truth": 0}, {"key": "39523865", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.571766609489649, "ground_truth": 0}, {"key": "39523865", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6315943177710895, "ground_truth": 0}, {"key": "33146158", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.803173789093808, "ground_truth": 0}, {"key": "33146158", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6926419917003295, "ground_truth": 0}, {"key": "33146158", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.63341027192384, "ground_truth": 0}, {"key": "33146158", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819585051755, "ground_truth": 0}, {"key": "33146158", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165148022677, "ground_truth": 0}, {"key": "32083974", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.737158164017372, "ground_truth": 0}, {"key": "32083974", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6113819456936729, "ground_truth": 0}, {"key": "32083974", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8104789307220066, "ground_truth": 0}, {"key": "32083974", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4205995809144802, "ground_truth": 0}, {"key": "32083974", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.656658239987189, "ground_truth": 0}, {"key": "34378482", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9477691477494595, "ground_truth": 0}, {"key": "34378482", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.93534651160876, "ground_truth": 0}, {"key": "34378482", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9612438050515013, "ground_truth": 0}, {"key": "34378482", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267960847076, "ground_truth": 0}, {"key": "34378482", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646904097945, "ground_truth": 0}, {"key": "38080102", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6076631723261465, "ground_truth": 0}, {"key": "38080102", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4804786879017251, "ground_truth": 0}, {"key": "38080102", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4016877928469406, "ground_truth": 0}, {"key": "38080102", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.40356685684883115, "ground_truth": 0}, {"key": "38080102", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4186969180057638, "ground_truth": 0}, {"key": "40244537", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.663668962236951, "ground_truth": 0}, {"key": "40244537", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8104789076163246, "ground_truth": 0}, {"key": "40244537", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7310585932085516, "ground_truth": 0}, {"key": "40244537", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195249426002, "ground_truth": 0}, {"key": "40244537", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740088810481, "ground_truth": 0}, {"key": "33497789", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9130583383578158, "ground_truth": 0}, {"key": "33497789", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9118099441465706, "ground_truth": 0}, {"key": "33497789", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8548846332143766, "ground_truth": 0}, {"key": "33497789", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359891070798, "ground_truth": 0}, {"key": "33497789", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892337004647418, "ground_truth": 0}, {"key": "28816889", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8210441160356103, "ground_truth": 0}, {"key": "28816889", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8816149019617269, "ground_truth": 0}, {"key": "28816889", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9161096195593708, "ground_truth": 0}, {"key": "28816889", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068875554307, "ground_truth": 0}, {"key": "28816889", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897150006296, "ground_truth": 0}, {"key": "38157127", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.47463115364712144, "ground_truth": 0}, {"key": "38157127", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5136684507661633, "ground_truth": 0}, {"key": "38157127", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.348645133915987, "ground_truth": 0}, {"key": "38157127", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.39793842636224114, "ground_truth": 0}, {"key": "38157127", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2553436741509917, "ground_truth": 0}, {"key": "36183569", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4186969447944143, "ground_truth": 0}, {"key": "36183569", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40733339977356914, "ground_truth": 0}, {"key": "36183569", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4320633957921285, "ground_truth": 0}, {"key": "36183569", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.33982762842491643, "ground_truth": 0}, {"key": "36183569", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.556399583413709, "ground_truth": 0}, {"key": "36012016", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6992544117896567, "ground_truth": 0}, {"key": "36012016", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6791786831870646, "ground_truth": 0}, {"key": "36012016", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.861538198632693, "ground_truth": 0}, {"key": "36012016", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026748865144, "ground_truth": 0}, {"key": "36012016", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.803173794249372, "ground_truth": 0}, {"key": "34571973", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6959583447328279, "ground_truth": 0}, {"key": "34571973", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7401743711900061, "ground_truth": 0}, {"key": "34571973", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7549150056442525, "ground_truth": 0}, {"key": "34571973", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251061639181, "ground_truth": 0}, {"key": "34571973", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876299865065961, "ground_truth": 0}, {"key": "38707498", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8376199515073736, "ground_truth": 0}, {"key": "38707498", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8856314640671541, "ground_truth": 0}, {"key": "38707498", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.731058600124804, "ground_truth": 0}, {"key": "38707498", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850329417109, "ground_truth": 0}, {"key": "38707498", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336986499209, "ground_truth": 0}, {"key": "35459082", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9750122048540981, "ground_truth": 0}, {"key": "35459082", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9770226295328666, "ground_truth": 0}, {"key": "35459082", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9768465911353248, "ground_truth": 0}, {"key": "35459082", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9713473305862825, "ground_truth": 0}, {"key": "35459082", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9324533051338161, "ground_truth": 0}, {"key": "39464041", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.973644644498093, "ground_truth": 0}, {"key": "39464041", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9724147171399168, "ground_truth": 0}, {"key": "39464041", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9777138169807333, "ground_truth": 0}, {"key": "39464041", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.976846587607156, "ground_truth": 0}, {"key": "39464041", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9753900707499691, "ground_truth": 0}, {"key": "23782052", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.41679664513328046, "ground_truth": 0}, {"key": "23782052", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.737158146896679, "ground_truth": 0}, {"key": "23782052", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6548947202543267, "ground_truth": 0}, {"key": "23782052", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.42823338705420144, "ground_truth": 0}, {"key": "23782052", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.42250464241036706, "ground_truth": 0}, {"key": "36568455", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7676898515563514, "ground_truth": 0}, {"key": "36568455", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8438951112953256, "ground_truth": 0}, {"key": "36568455", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8969755746420721, "ground_truth": 0}, {"key": "36568455", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.880797090110565, "ground_truth": 0}, {"key": "36568455", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677655873796, "ground_truth": 0}, {"key": "38469552", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8679338354782452, "ground_truth": 0}, {"key": "38469552", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8879840499638828, "ground_truth": 0}, {"key": "38469552", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8643104557450595, "ground_truth": 0}, {"key": "38469552", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.904650526637319, "ground_truth": 0}, {"key": "38469552", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517147173309, "ground_truth": 0}, {"key": "35922277", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9263037196498761, "ground_truth": 0}, {"key": "35922277", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9136765229386614, "ground_truth": 0}, {"key": "35922277", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9184802437510636, "ground_truth": 0}, {"key": "35922277", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9219218375796838, "ground_truth": 0}, {"key": "35922277", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9343951642290064, "ground_truth": 0}, {"key": "32744293", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7295197701750916, "ground_truth": 0}, {"key": "32744293", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7704647708794071, "ground_truth": 0}, {"key": "32744293", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8354835396676797, "ground_truth": 0}, {"key": "32744293", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281395704881, "ground_truth": 0}, {"key": "32744293", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366575386562, "ground_truth": 0}, {"key": "30972362", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9539660947918343, "ground_truth": 0}, {"key": "30972362", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9683812328997148, "ground_truth": 0}, {"key": "30972362", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9629528315275983, "ground_truth": 0}, {"key": "30972362", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.941654161090746, "ground_truth": 0}, {"key": "30972362", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9588471080762955, "ground_truth": 0}, {"key": "36380943", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7008948127711399, "ground_truth": 0}, {"key": "36380943", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8044059134128915, "ground_truth": 0}, {"key": "36380943", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7690802233867937, "ground_truth": 0}, {"key": "36380943", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933324700655, "ground_truth": 0}, {"key": "36380943", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936454232198, "ground_truth": 0}, {"key": "36929355", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6943026954060683, "ground_truth": 0}, {"key": "36929355", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4571367032041968, "ground_truth": 0}, {"key": "36929355", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7549149984145486, "ground_truth": 0}, {"key": "36929355", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089203968602, "ground_truth": 0}, {"key": "36929355", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008947900787654, "ground_truth": 0}, {"key": "39127206", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7786493197909283, "ground_truth": 0}, {"key": "39127206", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.49218812953827146, "ground_truth": 0}, {"key": "39127206", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6206215766190941, "ground_truth": 0}, {"key": "39127206", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737836165445, "ground_truth": 0}, {"key": "39127206", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704718638219, "ground_truth": 0}, {"key": "36128318", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3738758064024871, "ground_truth": 0}, {"key": "36128318", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.27825680040910916, "ground_truth": 0}, {"key": "36128318", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.22815650393626455, "ground_truth": 0}, {"key": "36128318", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.25982563519999446, "ground_truth": 0}, {"key": "36128318", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.15817434785171708, "ground_truth": 0}, {"key": "39863480", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8428631310729126, "ground_truth": 0}, {"key": "39863480", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9092645078538706, "ground_truth": 0}, {"key": "39863480", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.844921526403466, "ground_truth": 0}, {"key": "39863480", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884660985273, "ground_truth": 0}, {"key": "39863480", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185804313291, "ground_truth": 0}, {"key": "38634057", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8969755766703841, "ground_truth": 0}, {"key": "38634057", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8723473808374812, "ground_truth": 0}, {"key": "38634057", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8902942260419228, "ground_truth": 0}, {"key": "38634057", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354775972973, "ground_truth": 0}, {"key": "38634057", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575642416277, "ground_truth": 0}, {"key": "33131935", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.906653117438889, "ground_truth": 0}, {"key": "33131935", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.863391623924433, "ground_truth": 0}, {"key": "33131935", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9309620741103855, "ground_truth": 0}, {"key": "33131935", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8879840399207332, "ground_truth": 0}, {"key": "33131935", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145667631265, "ground_truth": 0}, {"key": "39021319", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6187804332616038, "ground_truth": 0}, {"key": "39021319", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.39233683471261155, "ground_truth": 0}, {"key": "39021319", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6495786265718227, "ground_truth": 0}, {"key": "39021319", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760195782236, "ground_truth": 0}, {"key": "39021319", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4054487198859457, "ground_truth": 0}, {"key": "40644571", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5234203591034752, "ground_truth": 0}, {"key": "40644571", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5813030961831136, "ground_truth": 0}, {"key": "40644571", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46879063446770997, "ground_truth": 0}, {"key": "40644571", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262530453752, "ground_truth": 0}, {"key": "40644571", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3611647301469871, "ground_truth": 0}, {"key": "14681877", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9615338090978339, "ground_truth": 0}, {"key": "14681877", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9268352781122182, "ground_truth": 0}, {"key": "14681877", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9582261158377702, "ground_truth": 0}, {"key": "14681877", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9563089411318328, "ground_truth": 0}, {"key": "14681877", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531158150634, "ground_truth": 0}, {"key": "36570890", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6187804061747068, "ground_truth": 0}, {"key": "36570890", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.41679663931170996, "ground_truth": 0}, {"key": "36570890", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6495786382057275, "ground_truth": 0}, {"key": "36570890", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331483098891, "ground_truth": 0}, {"key": "36570890", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984069533524, "ground_truth": 0}, {"key": "30452755", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9289263309011815, "ground_truth": 0}, {"key": "30452755", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7918210875284468, "ground_truth": 0}, {"key": "30452755", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8539127500711846, "ground_truth": 0}, {"key": "30452755", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879312092584815, "ground_truth": 0}, {"key": "30452755", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.771843492772291, "ground_truth": 0}, {"key": "37347053", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5136684582863542, "ground_truth": 0}, {"key": "37347053", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7356416332330015, "ground_truth": 0}, {"key": "37347053", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7295197598757143, "ground_truth": 0}, {"key": "37347053", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004048441419, "ground_truth": 0}, {"key": "37347053", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073678537308, "ground_truth": 0}, {"key": "38890979", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6926419796483687, "ground_truth": 0}, {"key": "38890979", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.43398146258829534, "ground_truth": 0}, {"key": "38890979", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6113819813275609, "ground_truth": 0}, {"key": "38890979", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832233630976, "ground_truth": 0}, {"key": "38890979", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.38861802933959244, "ground_truth": 0}, {"key": "32974694", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7431680034963362, "ground_truth": 0}, {"key": "32974694", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8255897095842217, "ground_truth": 0}, {"key": "32974694", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6825737440639796, "ground_truth": 0}, {"key": "32974694", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325218701906, "ground_truth": 0}, {"key": "32974694", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185792439826, "ground_truth": 0}, {"key": "38519940", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8910549569998064, "ground_truth": 0}, {"key": "38519940", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8068526175064302, "ground_truth": 0}, {"key": "38519940", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.934395168230083, "ground_truth": 0}, {"key": "38519940", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9309620716594458, "ground_truth": 0}, {"key": "38519940", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9299510394733762, "ground_truth": 0}, {"key": "38870104", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8732148175012601, "ground_truth": 0}, {"key": "38870104", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8198933176767487, "ground_truth": 0}, {"key": "38870104", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8333245931982848, "ground_truth": 0}, {"key": "38870104", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240792767953, "ground_truth": 0}, {"key": "38870104", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894659249351, "ground_truth": 0}, {"key": "34283161", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "34283161", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5097643890025076, "ground_truth": 0}, {"key": "34283161", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5136684890295825, "ground_truth": 0}, {"key": "34283161", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030858205992, "ground_truth": 0}, {"key": "34283161", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922079192124267, "ground_truth": 0}, {"key": "31650463", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6740504795882462, "ground_truth": 0}, {"key": "31650463", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8902942264864173, "ground_truth": 0}, {"key": "31650463", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7520125812351427, "ground_truth": 0}, {"key": "31650463", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743789961919, "ground_truth": 0}, {"key": "31650463", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740322863475, "ground_truth": 0}, {"key": "35589432", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8365545571600665, "ground_truth": 0}, {"key": "35589432", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6992544222958683, "ground_truth": 0}, {"key": "35589432", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6943026910886322, "ground_truth": 0}, {"key": "35589432", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314750650344, "ground_truth": 0}, {"key": "35589432", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.844921507958257, "ground_truth": 0}, {"key": "14412752", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7943849738758545, "ground_truth": 0}, {"key": "14412752", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7620701116074622, "ground_truth": 0}, {"key": "14412752", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7534666495782403, "ground_truth": 0}, {"key": "14412752", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321910606786, "ground_truth": 0}, {"key": "14412752", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283036976835, "ground_truth": 0}, {"key": "37271183", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9629528269700959, "ground_truth": 0}, {"key": "37271183", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9764905475483305, "ground_truth": 0}, {"key": "37271183", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9780517493140406, "ground_truth": 0}, {"key": "37271183", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9750122045928604, "ground_truth": 0}, {"key": "37271183", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9763105282272024, "ground_truth": 0}, {"key": "35588153", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9496693678732939, "ground_truth": 0}, {"key": "35588153", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9575961708741283, "ground_truth": 0}, {"key": "35588153", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9086178921518454, "ground_truth": 0}, {"key": "35588153", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9433475814894846, "ground_truth": 0}, {"key": "35588153", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9390248138304871, "ground_truth": 0}, {"key": "39876692", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8397339709491372, "ground_truth": 0}, {"key": "39876692", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8428631553339347, "ground_truth": 0}, {"key": "39876692", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8267117993867211, "ground_truth": 0}, {"key": "39876692", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672289626046, "ground_truth": 0}, {"key": "39876692", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619324240545, "ground_truth": 0}, {"key": "38992323", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8255897260032025, "ground_truth": 0}, {"key": "38992323", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7676898702903411, "ground_truth": 0}, {"key": "38992323", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8688267905086287, "ground_truth": 0}, {"key": "38992323", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799928954000118, "ground_truth": 0}, {"key": "38992323", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531122221307, "ground_truth": 0}, {"key": "37556002", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7592254011940057, "ground_truth": 0}, {"key": "37556002", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.677474026747477, "ground_truth": 0}, {"key": "37556002", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8529354907291411, "ground_truth": 0}, {"key": "37556002", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056350414707, "ground_truth": 0}, {"key": "37556002", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850470176137, "ground_truth": 0}, {"key": "39875801", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8333245801839786, "ground_truth": 0}, {"key": "39875801", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8311430532531962, "ground_truth": 0}, {"key": "39875801", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8267117968446093, "ground_truth": 0}, {"key": "39875801", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9039745013923066, "ground_truth": 0}, {"key": "39875801", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346103747068, "ground_truth": 0}, {"key": "39272285", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.33807713235481435, "ground_truth": 0}, {"key": "39272285", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.1112412186561143, "ground_truth": 0}, {"key": "39272285", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.1835936372752246, "ground_truth": 0}, {"key": "39272285", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.15921741125679567, "ground_truth": 0}, {"key": "39272285", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.19436781098855735, "ground_truth": 0}, {"key": "39629714", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7341195260819899, "ground_truth": 0}, {"key": "39629714", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6619228646542069, "ground_truth": 0}, {"key": "39629714", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4493926490182048, "ground_truth": 0}, {"key": "39629714", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306316653629, "ground_truth": 0}, {"key": "39629714", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.685949425682712, "ground_truth": 0}, {"key": "34043257", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7606506327905336, "ground_truth": 0}, {"key": "34043257", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6740504749886853, "ground_truth": 0}, {"key": "34043257", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8774767844615241, "ground_truth": 0}, {"key": "34043257", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8925625240675076, "ground_truth": 0}, {"key": "34043257", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210733758314, "ground_truth": 0}, {"key": "33995240", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3665897475809363, "ground_truth": 0}, {"key": "33995240", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5273165326115731, "ground_truth": 0}, {"key": "33995240", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.66017238648719, "ground_truth": 0}, {"key": "33995240", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755879915904321, "ground_truth": 0}, {"key": "33995240", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185291688371, "ground_truth": 0}, {"key": "39399948", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9092645171623509, "ground_truth": 0}, {"key": "39399948", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7461389908790237, "ground_truth": 0}, {"key": "39399948", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9039745071400547, "ground_truth": 0}, {"key": "39399948", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527866413096, "ground_truth": 0}, {"key": "39399948", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933362833042, "ground_truth": 0}, {"key": "33185890", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5717665936335762, "ground_truth": 0}, {"key": "33185890", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7648916220185514, "ground_truth": 0}, {"key": "33185890", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7563575767130243, "ground_truth": 0}, {"key": "33185890", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640252500042, "ground_truth": 0}, {"key": "33185890", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178993097795, "ground_truth": 0}, {"key": "35280425", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8210441007572189, "ground_truth": 0}, {"key": "35280425", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8807970841255953, "ground_truth": 0}, {"key": "35280425", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.852935466104463, "ground_truth": 0}, {"key": "35280425", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9348724449588194, "ground_truth": 0}, {"key": "35280425", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424474471045, "ground_truth": 0}, {"key": "16365170", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9299510473826771, "ground_truth": 0}, {"key": "16365170", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9299510440496618, "ground_truth": 0}, {"key": "16365170", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8991213779679594, "ground_truth": 0}, {"key": "16365170", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357639879935, "ground_truth": 0}, {"key": "16365170", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9343951597346705, "ground_truth": 0}, {"key": "24388238", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6039318335501443, "ground_truth": 0}, {"key": "24388238", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7786493172148371, "ground_truth": 0}, {"key": "24388238", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5602526441341927, "ground_truth": 0}, {"key": "24388238", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191701318201, "ground_truth": 0}, {"key": "24388238", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740190608095, "ground_truth": 0}, {"key": "35024827", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7248702953039464, "ground_truth": 0}, {"key": "35024827", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6976089142466793, "ground_truth": 0}, {"key": "35024827", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8255897177723265, "ground_truth": 0}, {"key": "35024827", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581650576821, "ground_truth": 0}, {"key": "35024827", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796269809701, "ground_truth": 0}, {"key": "38624944", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8539127455902632, "ground_truth": 0}, {"key": "38624944", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7704647888891853, "ground_truth": 0}, {"key": "38624944", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6001883608037158, "ground_truth": 0}, {"key": "38624944", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416362390922, "ground_truth": 0}, {"key": "38624944", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.811676014388792, "ground_truth": 0}, {"key": "34719830", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.831143039997504, "ground_truth": 0}, {"key": "34719830", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9319595830436759, "ground_truth": 0}, {"key": "34719830", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9005297878435816, "ground_truth": 0}, {"key": "34719830", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277953085674, "ground_truth": 0}, {"key": "34719830", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104469980933, "ground_truth": 0}, {"key": "38995225", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46295865479098514, "ground_truth": 0}, {"key": "38995225", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6584175093964341, "ground_truth": 0}, {"key": "38995225", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4726834477270254, "ground_truth": 0}, {"key": "38995225", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.44167302683686255, "ground_truth": 0}, {"key": "38995225", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982764312754804, "ground_truth": 0}, {"key": "34242311", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7401743693891033, "ground_truth": 0}, {"key": "34242311", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7431680300970384, "ground_truth": 0}, {"key": "34242311", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8428631473649778, "ground_truth": 0}, {"key": "34242311", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445522617346, "ground_truth": 0}, {"key": "34242311", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354781906481, "ground_truth": 0}, {"key": "39253748", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7994423236615589, "ground_truth": 0}, {"key": "39253748", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7879312034837137, "ground_truth": 0}, {"key": "39253748", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8606036341213106, "ground_truth": 0}, {"key": "39253748", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473754656182, "ground_truth": 0}, {"key": "39253748", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799928967529893, "ground_truth": 0}, {"key": "37131104", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9899086844737466, "ground_truth": 0}, {"key": "37131104", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9973060859479976, "ground_truth": 0}, {"key": "37131104", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9917484019535098, "ground_truth": 0}, {"key": "37131104", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9899086849953641, "ground_truth": 0}, {"key": "37131104", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.99224446295886, "ground_truth": 0}, {"key": "38490554", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8128673080320142, "ground_truth": 0}, {"key": "38490554", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8244619343088111, "ground_truth": 0}, {"key": "38490554", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9496693641121541, "ground_truth": 0}, {"key": "38490554", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9635062366424092, "ground_truth": 0}, {"key": "38490554", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9130583374192767, "ground_truth": 0}, {"key": "29009500", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4054487197751252, "ground_truth": 0}, {"key": "29009500", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.37754064944194093, "ground_truth": 0}, {"key": "29009500", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4474602735573713, "ground_truth": 0}, {"key": "29009500", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.48438010067552034, "ground_truth": 0}, {"key": "29009500", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.33285229328344673, "ground_truth": 0}, {"key": "36703057", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5813031049642148, "ground_truth": 0}, {"key": "36703057", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6893056140310667, "ground_truth": 0}, {"key": "36703057", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.754914966233317, "ground_truth": 0}, {"key": "36703057", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624886589486, "ground_truth": 0}, {"key": "36703057", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256069086794, "ground_truth": 0}, {"key": "34876987", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.931462510847349, "ground_truth": 0}, {"key": "34876987", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9278877931419104, "ground_truth": 0}, {"key": "34876987", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8991213619252965, "ground_truth": 0}, {"key": "34876987", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9005297814938502, "ground_truth": 0}, {"key": "34876987", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531240306028, "ground_truth": 0}, {"key": "36209258", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8152324835254912, "ground_truth": 0}, {"key": "36209258", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9124361636261265, "ground_truth": 0}, {"key": "36209258", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7956581160820492, "ground_truth": 0}, {"key": "36209258", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.825589710298355, "ground_truth": 0}, {"key": "36209258", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199650689902, "ground_truth": 0}, {"key": "36854437", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2365162226637815, "ground_truth": 0}, {"key": "36854437", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2766905245772006, "ground_truth": 0}, {"key": "36854437", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3539862799538839, "ground_truth": 0}, {"key": "36854437", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.33285231628288425, "ground_truth": 0}, {"key": "36854437", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2450850046515572, "ground_truth": 0}, {"key": "38047723", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.21469142597190707, "ground_truth": 0}, {"key": "38047723", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.20055768338541544, "ground_truth": 0}, {"key": "38047723", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2133771701575424, "ground_truth": 0}, {"key": "38047723", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.19436781125964037, "ground_truth": 0}, {"key": "38047723", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594721340344544, "ground_truth": 0}, {"key": "34287816", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6671477051955459, "ground_truth": 0}, {"key": "34287816", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.661922878280236, "ground_truth": 0}, {"key": "34287816", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7416740165451295, "ground_truth": 0}, {"key": "34287816", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118739737122, "ground_truth": 0}, {"key": "34287816", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702834890527, "ground_truth": 0}, {"key": "33235855", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9504109804668152, "ground_truth": 0}, {"key": "33235855", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.955981347704751, "ground_truth": 0}, {"key": "33235855", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9738443826432401, "ground_truth": 0}, {"key": "33235855", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9757623644911525, "ground_truth": 0}, {"key": "33235855", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9353465192928891, "ground_truth": 0}, {"key": "34381016", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.750552754730631, "ground_truth": 0}, {"key": "34381016", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.848972206721181, "ground_truth": 0}, {"key": "34381016", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7401743529462448, "ground_truth": 0}, {"key": "34381016", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673296967915, "ground_truth": 0}, {"key": "34381016", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884635107683, "ground_truth": 0}, {"key": "28064995", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5794004172150028, "ground_truth": 0}, {"key": "28064995", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.718594402871202, "ground_truth": 0}, {"key": "28064995", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6334102616027542, "ground_truth": 0}, {"key": "28064995", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918558856568, "ground_truth": 0}, {"key": "28064995", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47073661487573987, "ground_truth": 0}, {"key": "37576197", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.17781087762260775, "ground_truth": 0}, {"key": "37576197", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40733340261567486, "ground_truth": 0}, {"key": "37576197", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.41679662912459114, "ground_truth": 0}, {"key": "37576197", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4225046280623098, "ground_truth": 0}, {"key": "37576197", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2598256401038203, "ground_truth": 0}, {"key": "34454741", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4882833815550605, "ground_truth": 0}, {"key": "34454741", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4416730055605998, "ground_truth": 0}, {"key": "34454741", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5195213352822715, "ground_truth": 0}, {"key": "34454741", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708733530078, "ground_truth": 0}, {"key": "34454741", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4551986039444893, "ground_truth": 0}, {"key": "34766970", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.544801375088027, "ground_truth": 0}, {"key": "34766970", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.35398630106662204, "ground_truth": 0}, {"key": "34766970", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.27982849441698904, "ground_truth": 0}, {"key": "34766970", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974735160165845, "ground_truth": 0}, {"key": "34766970", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237258966692, "ground_truth": 0}, {"key": "35574186", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8615382084271727, "ground_truth": 0}, {"key": "35574186", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7386690638697904, "ground_truth": 0}, {"key": "35574186", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9012274192233923, "ground_truth": 0}, {"key": "35574186", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110404517462, "ground_truth": 0}, {"key": "35574186", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920141740677, "ground_truth": 0}, {"key": "35486470", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6132365565982263, "ground_truth": 0}, {"key": "35486470", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.517570892607997, "ground_truth": 0}, {"key": "35486470", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6636689472613373, "ground_truth": 0}, {"key": "35486470", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026686304234, "ground_truth": 0}, {"key": "35486470", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633503494163, "ground_truth": 0}, {"key": "40977702", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.41111087444193906, "ground_truth": 0}, {"key": "40977702", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6688802595873968, "ground_truth": 0}, {"key": "40977702", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7233094757341293, "ground_truth": 0}, {"key": "40977702", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199190769712, "ground_truth": 0}, {"key": "40977702", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684648544135, "ground_truth": 0}, {"key": "35336618", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9190632827180215, "ground_truth": 0}, {"key": "35336618", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8386797669108776, "ground_truth": 0}, {"key": "35336618", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9433475753019028, "ground_truth": 0}, {"key": "35336618", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970760241259, "ground_truth": 0}, {"key": "35336618", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9412234354576479, "ground_truth": 0}, {"key": "33024679", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6495786367247658, "ground_truth": 0}, {"key": "33024679", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.67060828459369, "ground_truth": 0}, {"key": "33024679", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8056321829686793, "ground_truth": 0}, {"key": "33024679", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640262736437, "ground_truth": 0}, {"key": "33024679", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494525695164, "ground_truth": 0}, {"key": "37451334", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6926419842665182, "ground_truth": 0}, {"key": "37451334", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.727975458815559, "ground_truth": 0}, {"key": "37451334", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8479677639089133, "ground_truth": 0}, {"key": "37451334", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549581607162, "ground_truth": 0}, {"key": "37451334", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.791821081669376, "ground_truth": 0}, {"key": "33354824", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5097644122632813, "ground_truth": 0}, {"key": "33354824", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "33354824", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.43014733505473335, "ground_truth": 0}, {"key": "33354824", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.29259528173004135, "ground_truth": 0}, {"key": "33354824", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.366589710284963, "ground_truth": 0}, {"key": "34688538", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7371581608959635, "ground_truth": 0}, {"key": "34688538", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7799929114555342, "ground_truth": 0}, {"key": "34688538", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6992544006640118, "ground_truth": 0}, {"key": "34688538", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316972081962, "ground_truth": 0}, {"key": "34688538", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118984655264, "ground_truth": 0}, {"key": "33646276", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3056973344761743, "ground_truth": 0}, {"key": "33646276", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3904758394239726, "ground_truth": 0}, {"key": "33646276", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3276683152394597, "ground_truth": 0}, {"key": "33646276", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.30404166015525164, "ground_truth": 0}, {"key": "33646276", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.46490158237657103, "ground_truth": 0}, {"key": "40322608", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9207896796681941, "ground_truth": 0}, {"key": "40322608", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9118099538503416, "ground_truth": 0}, {"key": "40322608", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9178933713006906, "ground_truth": 0}, {"key": "40322608", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.853912752933086, "ground_truth": 0}, {"key": "40322608", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377795034418, "ground_truth": 0}, {"key": "39565762", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9059898208562763, "ground_truth": 0}, {"key": "39565762", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8962513709368065, "ground_truth": 0}, {"key": "39565762", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7476159508029006, "ground_truth": 0}, {"key": "39565762", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673129353325, "ground_truth": 0}, {"key": "39565762", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772332518516, "ground_truth": 0}, {"key": "30534259", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6297746054204059, "ground_truth": 0}, {"key": "30534259", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6460136766281023, "ground_truth": 0}, {"key": "30534259", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7853085728628225, "ground_truth": 0}, {"key": "30534259", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210675399185, "ground_truth": 0}, {"key": "30534259", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.554470466301206, "ground_truth": 0}, {"key": "39644242", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8705972646159874, "ground_truth": 0}, {"key": "39644242", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7233094639182371, "ground_truth": 0}, {"key": "39644242", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.835483536936381, "ground_truth": 0}, {"key": "39644242", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744650649637, "ground_truth": 0}, {"key": "39644242", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.817574478721977, "ground_truth": 0}, {"key": "19853740", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6076631573189969, "ground_truth": 0}, {"key": "19853740", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8044059098397027, "ground_truth": 0}, {"key": "19853740", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.816406385162424, "ground_truth": 0}, {"key": "19853740", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.82218912534965, "ground_truth": 0}, {"key": "19853740", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.774583373348791, "ground_truth": 0}, {"key": "33023078", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8824278695710662, "ground_truth": 0}, {"key": "33023078", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8489721947149015, "ground_truth": 0}, {"key": "33023078", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8300437766967231, "ground_truth": 0}, {"key": "33023078", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972590766985, "ground_truth": 0}, {"key": "33023078", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303263201608, "ground_truth": 0}, {"key": "38329806", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.44552953440891857, "ground_truth": 0}, {"key": "38329806", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3007455853475687, "ground_truth": 0}, {"key": "38329806", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5640984714207629, "ground_truth": 0}, {"key": "38329806", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974731199685874, "ground_truth": 0}, {"key": "38329806", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.435901503103288, "ground_truth": 0}, {"key": "38761942", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4960938587606593, "ground_truth": 0}, {"key": "38761942", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5736784217281456, "ground_truth": 0}, {"key": "38761942", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3793783966408914, "ground_truth": 0}, {"key": "38761942", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552952496438036, "ground_truth": 0}, {"key": "38761942", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058590977805998, "ground_truth": 0}, {"key": "33773576", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6688802730621884, "ground_truth": 0}, {"key": "33773576", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.680878612003705, "ground_truth": 0}, {"key": "33773576", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7106282882373711, "ground_truth": 0}, {"key": "33773576", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4707366058123672, "ground_truth": 0}, {"key": "33773576", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197877137727, "ground_truth": 0}, {"key": "37642631", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7620701192534687, "ground_truth": 0}, {"key": "37642631", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8116760259966475, "ground_truth": 0}, {"key": "37642631", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6495786210947665, "ground_truth": 0}, {"key": "37642631", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688190166401, "ground_truth": 0}, {"key": "37642631", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706083169365519, "ground_truth": 0}, {"key": "36609836", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6688802610448533, "ground_truth": 0}, {"key": "36609836", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7866228400469362, "ground_truth": 0}, {"key": "36609836", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9161096140937479, "ground_truth": 0}, {"key": "36609836", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867911798576, "ground_truth": 0}, {"key": "36609836", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531115832437, "ground_truth": 0}, {"key": "41035610", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7074047252050819, "ground_truth": 0}, {"key": "41035610", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6513548681466778, "ground_truth": 0}, {"key": "41035610", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5717666129970279, "ground_truth": 0}, {"key": "41035610", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506574113007, "ground_truth": 0}, {"key": "41035610", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872257267625, "ground_truth": 0}, {"key": "37592684", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7866228090717222, "ground_truth": 0}, {"key": "37592684", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.801935827011587, "ground_truth": 0}, {"key": "37592684", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8244619237584375, "ground_truth": 0}, {"key": "37592684", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377713594698, "ground_truth": 0}, {"key": "37592684", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675412278033, "ground_truth": 0}, {"key": "38951040", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.823328383307658, "ground_truth": 0}, {"key": "38951040", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7025300626261048, "ground_truth": 0}, {"key": "38951040", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8376199681918483, "ground_truth": 0}, {"key": "38951040", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646053129039, "ground_truth": 0}, {"key": "38951040", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358120133743, "ground_truth": 0}, {"key": "40774469", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.08756384482106228, "ground_truth": 0}, {"key": "40774469", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.1393963910552885, "ground_truth": 0}, {"key": "40774469", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.48633150793370106, "ground_truth": 0}, {"key": "40774469", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064641415784, "ground_truth": 0}, {"key": "40774469", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.29583984530284346, "ground_truth": 0}, {"key": "40876288", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8128673275971685, "ground_truth": 0}, {"key": "40876288", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8479677572458219, "ground_truth": 0}, {"key": "40876288", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5234203483704415, "ground_truth": 0}, {"key": "40876288", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757645951144077, "ground_truth": 0}, {"key": "40876288", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708887841441, "ground_truth": 0}, {"key": "40340131", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8006919996157325, "ground_truth": 0}, {"key": "40340131", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8887587989856897, "ground_truth": 0}, {"key": "40340131", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8469578344408782, "ground_truth": 0}, {"key": "40340131", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148394836692, "ground_truth": 0}, {"key": "40340131", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872045917113017, "ground_truth": 0}, {"key": "30121591", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7745833913123409, "ground_truth": 0}, {"key": "30121591", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7853085733075136, "ground_truth": 0}, {"key": "30121591", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5583269853277212, "ground_truth": 0}, {"key": "30121591", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333245814230607, "ground_truth": 0}, {"key": "30121591", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085791590259, "ground_truth": 0}, {"key": "35623366", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8606036129983979, "ground_truth": 0}, {"key": "35623366", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6279512148177195, "ground_truth": 0}, {"key": "35623366", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8006919987356041, "ground_truth": 0}, {"key": "35623366", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.760650630286765, "ground_truth": 0}, {"key": "35623366", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849722488766, "ground_truth": 0}, {"key": "41014093", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7592253965435665, "ground_truth": 0}, {"key": "41014093", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6334102706677611, "ground_truth": 0}, {"key": "41014093", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7248702778438116, "ground_truth": 0}, {"key": "41014093", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982302565559, "ground_truth": 0}, {"key": "41014093", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127539883287, "ground_truth": 0}, {"key": "11387984", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7401743762995111, "ground_truth": 0}, {"key": "11387984", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5312093754448184, "ground_truth": 0}, {"key": "11387984", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8816148982336901, "ground_truth": 0}, {"key": "11387984", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825924376915, "ground_truth": 0}, {"key": "11387984", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059075038161, "ground_truth": 0}, {"key": "39508312", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8116760273942741, "ground_truth": 0}, {"key": "39508312", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6315943054056574, "ground_truth": 0}, {"key": "39508312", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6584174899352585, "ground_truth": 0}, {"key": "39508312", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.754914968527606, "ground_truth": 0}, {"key": "39508312", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.732591847971668, "ground_truth": 0}, {"key": "35815369", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7759445349536117, "ground_truth": 0}, {"key": "35815369", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5660185020723164, "ground_truth": 0}, {"key": "35815369", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.740174380762753, "ground_truth": 0}, {"key": "35815369", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880096821427, "ground_truth": 0}, {"key": "35815369", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4785288593967034, "ground_truth": 0}, {"key": "35802823", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5698526324269177, "ground_truth": 0}, {"key": "35802823", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.616935830121752, "ground_truth": 0}, {"key": "35802823", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6825737055649416, "ground_truth": 0}, {"key": "35802823", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864511273893134, "ground_truth": 0}, {"key": "35802823", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672036594309, "ground_truth": 0}, {"key": "38499968", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8128673033352831, "ground_truth": 0}, {"key": "38499968", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7577943703821951, "ground_truth": 0}, {"key": "38499968", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7431680150497814, "ground_truth": 0}, {"key": "38499968", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321783411428, "ground_truth": 0}, {"key": "38499968", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467656507022, "ground_truth": 0}, {"key": "36926726", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7490872306750896, "ground_truth": 0}, {"key": "36926726", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.779992913249595, "ground_truth": 0}, {"key": "36926726", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9136765318717601, "ground_truth": 0}, {"key": "36926726", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545660613259, "ground_truth": 0}, {"key": "36926726", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672147936524, "ground_truth": 0}, {"key": "40903712", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7879311951221041, "ground_truth": 0}, {"key": "40903712", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8407826015734362, "ground_truth": 0}, {"key": "40903712", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7520125536238207, "ground_truth": 0}, {"key": "40903712", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.823328403412674, "ground_truth": 0}, {"key": "40903712", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849721329269, "ground_truth": 0}, {"key": "19614862", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7826624868037055, "ground_truth": 0}, {"key": "19614862", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2766905308272933, "ground_truth": 0}, {"key": "19614862", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7931059655326105, "ground_truth": 0}, {"key": "19614862", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983121840048623, "ground_truth": 0}, {"key": "19614862", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297745992853687, "ground_truth": 0}, {"key": "38861704", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6001883263394998, "ground_truth": 0}, {"key": "38861704", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5679365869631834, "ground_truth": 0}, {"key": "38861704", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4726834667441891, "ground_truth": 0}, {"key": "38861704", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116311696203, "ground_truth": 0}, {"key": "38861704", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711921221278, "ground_truth": 0}, {"key": "34349607", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5078118738217131, "ground_truth": 0}, {"key": "34349607", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6261241502056387, "ground_truth": 0}, {"key": "34349607", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.35042136207808455, "ground_truth": 0}, {"key": "34349607", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.535098451718177, "ground_truth": 0}, {"key": "34349607", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591082420393, "ground_truth": 0}, {"key": "20773800", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.1847675061962517, "ground_truth": 0}, {"key": "20773800", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.07263670705669714, "ground_truth": 0}, {"key": "20773800", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.10087862153143967, "ground_truth": 0}, {"key": "20773800", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.10818895614290329, "ground_truth": 0}, {"key": "20773800", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.08449275835798901, "ground_truth": 0}, {"key": "35545608", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6601723725135193, "ground_truth": 0}, {"key": "35545608", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40544874859840463, "ground_truth": 0}, {"key": "35545608", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6297746212944273, "ground_truth": 0}, {"key": "35545608", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291157432167, "ground_truth": 0}, {"key": "35545608", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688384976818, "ground_truth": 0}, {"key": "37258984", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5736784218588775, "ground_truth": 0}, {"key": "37258984", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3923368456442243, "ground_truth": 0}, {"key": "37258984", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5563995745806168, "ground_truth": 0}, {"key": "37258984", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995703037549, "ground_truth": 0}, {"key": "37258984", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47268346928984584, "ground_truth": 0}, {"key": "37274562", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7606506558829824, "ground_truth": 0}, {"key": "37274562", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.70740469208703, "ground_truth": 0}, {"key": "37274562", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8832359822464031, "ground_truth": 0}, {"key": "37274562", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897128513501, "ground_truth": 0}, {"key": "37274562", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.744656336335064, "ground_truth": 0}, {"key": "40828068", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8697145837192317, "ground_truth": 0}, {"key": "40828068", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8044059286322829, "ground_truth": 0}, {"key": "40828068", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7122321590014795, "ground_truth": 0}, {"key": "40828068", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441047549788, "ground_truth": 0}, {"key": "40828068", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377781867648, "ground_truth": 0}, {"key": "37807180", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8092759788305403, "ground_truth": 0}, {"key": "37807180", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8019358285181458, "ground_truth": 0}, {"key": "37807180", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7106282912901184, "ground_truth": 0}, {"key": "37807180", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760164939655, "ground_truth": 0}, {"key": "37807180", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506585174209, "ground_truth": 0}, {"key": "40748607", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9700134931840098, "ground_truth": 0}, {"key": "40748607", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9862576798438122, "ground_truth": 0}, {"key": "40748607", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9848109512185282, "ground_truth": 0}, {"key": "40748607", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9759464461231806, "ground_truth": 0}, {"key": "40748607", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.984093608449807, "ground_truth": 0}, {"key": "40123819", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8969755657625894, "ground_truth": 0}, {"key": "40123819", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8459424390863844, "ground_truth": 0}, {"key": "40123819", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9130583467366609, "ground_truth": 0}, {"key": "40123819", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869798096608, "ground_truth": 0}, {"key": "40123819", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9252299589812458, "ground_truth": 0}, {"key": "38453867", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7690802241921765, "ground_truth": 0}, {"key": "38453867", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8080672282259382, "ground_truth": 0}, {"key": "38453867", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5774953684537438, "ground_truth": 0}, {"key": "38453867", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.773216357794563, "ground_truth": 0}, {"key": "38453867", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684562435022, "ground_truth": 0}, {"key": "38944856", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9420819121004503, "ground_truth": 0}, {"key": "38944856", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8969755687281433, "ground_truth": 0}, {"key": "38944856", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8469578388077991, "ground_truth": 0}, {"key": "38944856", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267738524648, "ground_truth": 0}, {"key": "38944856", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.764891614506584, "ground_truth": 0}, {"key": "35778898", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8723473676177314, "ground_truth": 0}, {"key": "35778898", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8947894562997437, "ground_truth": 0}, {"key": "35778898", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8376199614196427, "ground_truth": 0}, {"key": "35778898", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9372107953899682, "ground_truth": 0}, {"key": "35778898", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517181997477, "ground_truth": 0}, {"key": "32530125", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2094696932990392, "ground_truth": 0}, {"key": "32530125", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6132365514864817, "ground_truth": 0}, {"key": "32530125", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2829881279533823, "ground_truth": 0}, {"key": "32530125", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570645194383084, "ground_truth": 0}, {"key": "32530125", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2068940504776231, "ground_truth": 0}, {"key": "35010363", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5117165960188814, "ground_truth": 0}, {"key": "35010363", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3522017704965841, "ground_truth": 0}, {"key": "35010363", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5331544067290769, "ground_truth": 0}, {"key": "35010363", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804620030535, "ground_truth": 0}, {"key": "35010363", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947323958195, "ground_truth": 0}, {"key": "27514800", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7401743676733665, "ground_truth": 0}, {"key": "27514800", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8791467567961475, "ground_truth": 0}, {"key": "27514800", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9549844682391582, "ground_truth": 0}, {"key": "27514800", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.833324602227619, "ground_truth": 0}, {"key": "27514800", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215314975218, "ground_truth": 0}, {"key": "25725840", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.1623800440396423, "ground_truth": 0}, {"key": "25725840", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.14608725216707225, "ground_truth": 0}, {"key": "25725840", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4513265107779444, "ground_truth": 0}, {"key": "25725840", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.19314738225143144, "ground_truth": 0}, {"key": "25725840", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.24508501905853058, "ground_truth": 0}, {"key": "38327225", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7217432094783331, "ground_truth": 0}, {"key": "38327225", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5350984264275451, "ground_truth": 0}, {"key": "38327225", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6893056513843554, "ground_truth": 0}, {"key": "38327225", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5350984142424885, "ground_truth": 0}, {"key": "38327225", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269320110985, "ground_truth": 0}, {"key": "11991724", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.890294228842437, "ground_truth": 0}, {"key": "11991724", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8080672081531065, "ground_truth": 0}, {"key": "11991724", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9569571494234522, "ground_truth": 0}, {"key": "11991724", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.926835277532162, "ground_truth": 0}, {"key": "11991724", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549552030245, "ground_truth": 0}, {"key": "32217545", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8068526025594047, "ground_truth": 0}, {"key": "32217545", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8128673196054911, "ground_truth": 0}, {"key": "32217545", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7201715092101426, "ground_truth": 0}, {"key": "32217545", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.817574483107491, "ground_truth": 0}, {"key": "32217545", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.750552764842723, "ground_truth": 0}, {"key": "12731847", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5117166193709488, "ground_truth": 0}, {"key": "12731847", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6791786842027323, "ground_truth": 0}, {"key": "12731847", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.474631177480775, "ground_truth": 0}, {"key": "12731847", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632161286606524, "ground_truth": 0}, {"key": "12731847", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442251164103203, "ground_truth": 0}, {"key": "36827234", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8333245960446699, "ground_truth": 0}, {"key": "36827234", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8140528092288483, "ground_truth": 0}, {"key": "36827234", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8714748561807326, "ground_truth": 0}, {"key": "36827234", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767784434562, "ground_truth": 0}, {"key": "36827234", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675332393672, "ground_truth": 0}, {"key": "29111539", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7534666639452371, "ground_truth": 0}, {"key": "29111539", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8539127517154875, "ground_truth": 0}, {"key": "29111539", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8386797692819654, "ground_truth": 0}, {"key": "29111539", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163818765112, "ground_truth": 0}, {"key": "29111539", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647091634344, "ground_truth": 0}, {"key": "37763052", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7718434963544492, "ground_truth": 0}, {"key": "37763052", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7295197804082052, "ground_truth": 0}, {"key": "37763052", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8333246068193048, "ground_truth": 0}, {"key": "37763052", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.808067187950065, "ground_truth": 0}, {"key": "37763052", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867804490359, "ground_truth": 0}, {"key": "30682335", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5156199102231321, "ground_truth": 0}, {"key": "30682335", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5544704590410228, "ground_truth": 0}, {"key": "30682335", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5350984348883258, "ground_truth": 0}, {"key": "30682335", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883618031087, "ground_truth": 0}, {"key": "30682335", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984701860297, "ground_truth": 0}, {"key": "12261276", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.052618956199126196, "ground_truth": 0}, {"key": "12261276", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2213506917937318, "ground_truth": 0}, {"key": "12261276", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.07477004462625671, "ground_truth": 0}, {"key": "12261276", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.06560482882096733, "ground_truth": 0}, {"key": "12261276", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.13568954691496118, "ground_truth": 0}, {"key": "36912979", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.505859094594499, "ground_truth": 0}, {"key": "36912979", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4649015801010284, "ground_truth": 0}, {"key": "36912979", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2735743928108671, "ground_truth": 0}, {"key": "36912979", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.36116472354050816, "ground_truth": 0}, {"key": "36912979", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629585905025101, "ground_truth": 0}, {"key": "30205259", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8267117879227083, "ground_truth": 0}, {"key": "30205259", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8116759998345467, "ground_truth": 0}, {"key": "30205259", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9032942044237726, "ground_truth": 0}, {"key": "30205259", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122951856613, "ground_truth": 0}, {"key": "30205259", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215219064228, "ground_truth": 0}, {"key": "39458032", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9788748067404421, "ground_truth": 0}, {"key": "39458032", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9750122039967933, "ground_truth": 0}, {"key": "39458032", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9420819116699918, "ground_truth": 0}, {"key": "39458032", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9046505492720586, "ground_truth": 0}, {"key": "39458032", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.960062689330367, "ground_truth": 0}, {"key": "35116452", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.12168575133351282, "ground_truth": 0}, {"key": "35116452", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.35577488578707, "ground_truth": 0}, {"key": "35116452", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.30404168208111093, "ground_truth": 0}, {"key": "35116452", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.22270014129963733, "ground_truth": 0}, {"key": "35116452", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569734258134634, "ground_truth": 0}, {"key": "40107476", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8289387934089224, "ground_truth": 0}, {"key": "40107476", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8918110495488282, "ground_truth": 0}, {"key": "40107476", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7690802261569062, "ground_truth": 0}, {"key": "40107476", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9118099567974312, "ground_truth": 0}, {"key": "40107476", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527928368005, "ground_truth": 0}, {"key": "39501049", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9511422198494847, "ground_truth": 0}, {"key": "39501049", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9465966700235536, "ground_truth": 0}, {"key": "39501049", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9481545340775479, "ground_truth": 0}, {"key": "39501049", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9615338085366913, "ground_truth": 0}, {"key": "39501049", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9299510371062729, "ground_truth": 0}, {"key": "39642178", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5039061749666282, "ground_truth": 0}, {"key": "39642178", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5156199025860401, "ground_truth": 0}, {"key": "39642178", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.315735988733599, "ground_truth": 0}, {"key": "39642178", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117166218869577, "ground_truth": 0}, {"key": "39642178", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4863315329002321, "ground_truth": 0}, {"key": "38024796", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2658804542497374, "ground_truth": 0}, {"key": "38024796", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2613309093147987, "ground_truth": 0}, {"key": "38024796", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.17895589544592894, "ground_truth": 0}, {"key": "38024796", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.17781086683721, "ground_truth": 0}, {"key": "38024796", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.1167640173840407, "ground_truth": 0}, {"key": "36652079", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.667147686233845, "ground_truth": 0}, {"key": "36652079", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7620701050024435, "ground_truth": 0}, {"key": "36652079", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.682573756539455, "ground_truth": 0}, {"key": "36652079", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526360158872, "ground_truth": 0}, {"key": "36652079", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947517773606, "ground_truth": 0}, {"key": "32193402", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8568122974138802, "ground_truth": 0}, {"key": "32193402", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7505527544831125, "ground_truth": 0}, {"key": "32193402", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9079671360652704, "ground_truth": 0}, {"key": "32193402", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9399133529527169, "ground_truth": 0}, {"key": "32193402", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105570644576, "ground_truth": 0}, {"key": "32589706", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.767689846120513, "ground_truth": 0}, {"key": "32589706", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8661325012333851, "ground_truth": 0}, {"key": "32589706", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6601723847402956, "ground_truth": 0}, {"key": "32589706", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306259641363, "ground_truth": 0}, {"key": "32589706", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148226265609, "ground_truth": 0}, {"key": "38590589", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8499711757406119, "ground_truth": 0}, {"key": "38590589", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8705972684773055, "ground_truth": 0}, {"key": "38590589", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7969253758373388, "ground_truth": 0}, {"key": "38590589", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346140745838, "ground_truth": 0}, {"key": "38590589", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673240421362, "ground_truth": 0}, {"key": "37045414", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9860442893818344, "ground_truth": 0}, {"key": "37045414", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.972830767372553, "ground_truth": 0}, {"key": "37045414", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.979195509835576, "ground_truth": 0}, {"key": "37045414", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9833429604768593, "ground_truth": 0}, {"key": "37045414", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9853843315448626, "ground_truth": 0}, {"key": "33310095", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9149009607609575, "ground_truth": 0}, {"key": "33310095", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7662936553865218, "ground_truth": 0}, {"key": "33310095", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7416740198449004, "ground_truth": 0}, {"key": "33310095", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9500414785181847, "ground_truth": 0}, {"key": "33310095", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267118006400587, "ground_truth": 0}, {"key": "37934604", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9059898187132115, "ground_truth": 0}, {"key": "37934604", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.42823339594019577, "ground_truth": 0}, {"key": "37934604", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9167080806322044, "ground_truth": 0}, {"key": "37934604", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343680126273, "ground_truth": 0}, {"key": "37934604", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.894789463606044, "ground_truth": 0}, {"key": "39012181", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9916195463782759, "ground_truth": 0}, {"key": "39012181", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9906599752036415, "ground_truth": 0}, {"key": "39012181", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9894295124305889, "ground_truth": 0}, {"key": "39012181", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9860442889583957, "ground_truth": 0}, {"key": "39012181", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.990140144856802, "ground_truth": 0}, {"key": "40221674", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9778834101301361, "ground_truth": 0}, {"key": "40221674", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9372107899044457, "ground_truth": 0}, {"key": "40221674", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9822877019568329, "ground_truth": 0}, {"key": "40221674", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9618217247912824, "ground_truth": 0}, {"key": "40221674", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9492946353873456, "ground_truth": 0}, {"key": "36884862", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8031737906554659, "ground_truth": 0}, {"key": "36884862", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.91305834134973, "ground_truth": 0}, {"key": "36884862", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8428631403988709, "ground_truth": 0}, {"key": "36884862", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195272986812, "ground_truth": 0}, {"key": "36884862", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063896504083, "ground_truth": 0}, {"key": "39054429", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6224593230352551, "ground_truth": 0}, {"key": "39054429", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7401743631574914, "ground_truth": 0}, {"key": "39054429", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.41111087619638675, "ground_truth": 0}, {"key": "39054429", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.46684557342075556, "ground_truth": 0}, {"key": "39054429", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.46684559825354893, "ground_truth": 0}, {"key": "36753964", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.21601153778745474, "ground_truth": 0}, {"key": "36753964", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3007455955134126, "ground_truth": 0}, {"key": "36753964", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.40168783688165594, "ground_truth": 0}, {"key": "36753964", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3867634520361742, "ground_truth": 0}, {"key": "36753964", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557748955332719, "ground_truth": 0}, {"key": "37612459", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7969253762903512, "ground_truth": 0}, {"key": "37612459", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7759445563387458, "ground_truth": 0}, {"key": "37612459", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6132365708758218, "ground_truth": 0}, {"key": "37612459", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593314826274, "ground_truth": 0}, {"key": "37612459", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743490209721, "ground_truth": 0}, {"key": "36805789", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7057850185992919, "ground_truth": 0}, {"key": "36805789", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8955226828977638, "ground_truth": 0}, {"key": "36805789", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8031737868632897, "ground_truth": 0}, {"key": "36805789", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493134501823, "ground_truth": 0}, {"key": "36805789", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943856821084, "ground_truth": 0}, {"key": "12757394", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7138307861819462, "ground_truth": 0}, {"key": "12757394", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6825737291898938, "ground_truth": 0}, {"key": "12757394", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.40168781919655805, "ground_truth": 0}, {"key": "12757394", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4804786951087074, "ground_truth": 0}, {"key": "12757394", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711691209675, "ground_truth": 0}, {"key": "32192542", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9339146241017012, "ground_truth": 0}, {"key": "32192542", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9518632311459065, "ground_truth": 0}, {"key": "32192542", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9693242019066869, "ground_truth": 0}, {"key": "32192542", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.957277802773433, "ground_truth": 0}, {"key": "32192542", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9362850075423758, "ground_truth": 0}, {"key": "34856060", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5253688202320346, "ground_truth": 0}, {"key": "34856060", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.364777561124145, "ground_truth": 0}, {"key": "34856060", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5292634041585592, "ground_truth": 0}, {"key": "34856060", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689364867965, "ground_truth": 0}, {"key": "34856060", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878129427193, "ground_truth": 0}, {"key": "36083416", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9161096077633252, "ground_truth": 0}, {"key": "36083416", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9304582626808471, "ground_truth": 0}, {"key": "36083416", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9092645136705952, "ground_truth": 0}, {"key": "36083416", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9173026492445244, "ground_truth": 0}, {"key": "36083416", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418270707344, "ground_truth": 0}, {"key": "33839050", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.509764374841075, "ground_truth": 0}, {"key": "33839050", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5660185636813667, "ground_truth": 0}, {"key": "33839050", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.49023558610566437, "ground_truth": 0}, {"key": "33839050", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832493824114, "ground_truth": 0}, {"key": "33839050", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4073334090135089, "ground_truth": 0}, {"key": "18464690", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6842640273055824, "ground_truth": 0}, {"key": "18464690", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5467381602838033, "ground_truth": 0}, {"key": "18464690", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6352224503768101, "ground_truth": 0}, {"key": "18464690", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413918532116, "ground_truth": 0}, {"key": "18464690", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.37937837883471814, "ground_truth": 0}, {"key": "39212665", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.26894142006376187, "ground_truth": 0}, {"key": "39212665", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4073334084247557, "ground_truth": 0}, {"key": "39212665", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.15304216224503212, "ground_truth": 0}, {"key": "39212665", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.27357439205150647, "ground_truth": 0}, {"key": "39212665", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559408659756347, "ground_truth": 0}, {"key": "40094011", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6959583290280246, "ground_truth": 0}, {"key": "40094011", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7549150034902172, "ground_truth": 0}, {"key": "40094011", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7866228151186379, "ground_truth": 0}, {"key": "40094011", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583161224845, "ground_truth": 0}, {"key": "40094011", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585632706307, "ground_truth": 0}, {"key": "36036272", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6774740143435696, "ground_truth": 0}, {"key": "36036272", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6842640271563188, "ground_truth": 0}, {"key": "36036272", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.45713673405853367, "ground_truth": 0}, {"key": "36036272", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324705190095, "ground_truth": 0}, {"key": "36036272", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631623263565, "ground_truth": 0}, {"key": "30681904", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3923368221944666, "ground_truth": 0}, {"key": "30681904", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6206216153372287, "ground_truth": 0}, {"key": "30681904", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.31405053358727464, "ground_truth": 0}, {"key": "30681904", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199343799956, "ground_truth": 0}, {"key": "30681904", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167988701339, "ground_truth": 0}, {"key": "27834240", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.24944725820103664, "ground_truth": 0}, {"key": "27834240", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.37937839559404074, "ground_truth": 0}, {"key": "27834240", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.15921740856498973, "ground_truth": 0}, {"key": "27834240", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2281565037542716, "ground_truth": 0}, {"key": "27834240", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.1431877122584096, "ground_truth": 0}, {"key": "35025075", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4073334188551851, "ground_truth": 0}, {"key": "35025075", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6808786487067464, "ground_truth": 0}, {"key": "35025075", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4551985857919861, "ground_truth": 0}, {"key": "35025075", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118559495272, "ground_truth": 0}, {"key": "35025075", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102872094168, "ground_truth": 0}, {"key": "33316985", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.814052818673883, "ground_truth": 0}, {"key": "33316985", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6774740352198475, "ground_truth": 0}, {"key": "33316985", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6619228888207028, "ground_truth": 0}, {"key": "33316985", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303046519208, "ground_truth": 0}, {"key": "33316985", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416379576782, "ground_truth": 0}, {"key": "17037056", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3007455966542022, "ground_truth": 0}, {"key": "17037056", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4629586204341387, "ground_truth": 0}, {"key": "17037056", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4824290955557475, "ground_truth": 0}, {"key": "17037056", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.37022537804851285, "ground_truth": 0}, {"key": "17037056", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4016878130078204, "ground_truth": 0}, {"key": "34050457", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6976089369018672, "ground_truth": 0}, {"key": "34050457", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8354835417173947, "ground_truth": 0}, {"key": "34050457", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9124361669263125, "ground_truth": 0}, {"key": "34050457", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288600099386, "ground_truth": 0}, {"key": "34050457", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228311931568, "ground_truth": 0}, {"key": "34713745", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.41489883675459693, "ground_truth": 0}, {"key": "34713745", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4073334071373605, "ground_truth": 0}, {"key": "34713745", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.47268350140996274, "ground_truth": 0}, {"key": "34713745", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486735087869028, "ground_truth": 0}, {"key": "34713745", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014734057908893, "ground_truth": 0}, {"key": "40856210", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.1151622308332997, "ground_truth": 0}, {"key": "40856210", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.12421301070256319, "ground_truth": 0}, {"key": "40856210", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.10158944317436636, "ground_truth": 0}, {"key": "40856210", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2494472522579211, "ground_truth": 0}, {"key": "40856210", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.10970578084245194, "ground_truth": 0}, {"key": "40848302", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8019358228099184, "ground_truth": 0}, {"key": "40848302", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8267117800647579, "ground_truth": 0}, {"key": "40848302", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8615382096885956, "ground_truth": 0}, {"key": "40848302", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.893309399143227, "ground_truth": 0}, {"key": "40848302", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905302918245457, "ground_truth": 0}, {"key": "40636168", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3904758515064528, "ground_truth": 0}, {"key": "40636168", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.435901536479221, "ground_truth": 0}, {"key": "40636168", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3647775643383072, "ground_truth": 0}, {"key": "40636168", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4186968926524207, "ground_truth": 0}, {"key": "40636168", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238750000173, "ground_truth": 0}, {"key": "34423311", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7341195320440695, "ground_truth": 0}, {"key": "34423311", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5964331354090111, "ground_truth": 0}, {"key": "34423311", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7866228077160152, "ground_truth": 0}, {"key": "34423311", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239896130704, "ground_truth": 0}, {"key": "34423311", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370307865122914, "ground_truth": 0}, {"key": "34833945", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9416541618192306, "ground_truth": 0}, {"key": "34833945", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9764905467211097, "ground_truth": 0}, {"key": "34833945", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9597620573970134, "ground_truth": 0}, {"key": "34833945", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9846936456955363, "ground_truth": 0}, {"key": "34833945", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9666631740863777, "ground_truth": 0}, {"key": "21272328", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2509127824342453, "ground_truth": 0}, {"key": "21272328", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7634837711607796, "ground_truth": 0}, {"key": "21272328", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4054487394836532, "ground_truth": 0}, {"key": "21272328", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4882833842552233, "ground_truth": 0}, {"key": "21272328", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47073659849249544, "ground_truth": 0}, {"key": "38648957", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.36477755418146246, "ground_truth": 0}, {"key": "38648957", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.1710611792085841, "ground_truth": 0}, {"key": "38648957", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3451052765829062, "ground_truth": 0}, {"key": "38648957", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3923368311038878, "ground_truth": 0}, {"key": "38648957", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2281564982859195, "ground_truth": 0}, {"key": "24942981", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.22953520391808852, "ground_truth": 0}, {"key": "24942981", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.14128141957386867, "ground_truth": 0}, {"key": "24942981", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.22135069391623424, "ground_truth": 0}, {"key": "24942981", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.12592276687588572, "ground_truth": 0}, {"key": "24942981", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2094697002006522, "ground_truth": 0}, {"key": "35882366", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.13206614447910195, "ground_truth": 0}, {"key": "35882366", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8519528100611733, "ground_truth": 0}, {"key": "35882366", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.15817435209411881, "ground_truth": 0}, {"key": "35882366", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.17328820520954097, "ground_truth": 0}, {"key": "35882366", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.1744102755894471, "ground_truth": 0}, {"key": "40559523", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7295197750689949, "ground_truth": 0}, {"key": "40559523", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6791787107870454, "ground_truth": 0}, {"key": "40559523", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7704647763840322, "ground_truth": 0}, {"key": "40559523", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527944677072, "ground_truth": 0}, {"key": "40559523", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620700983278623, "ground_truth": 0}, {"key": "24632722", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6076631771500607, "ground_truth": 0}, {"key": "24632722", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4225046315317697, "ground_truth": 0}, {"key": "24632722", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.39047586460724565, "ground_truth": 0}, {"key": "24632722", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367950136237, "ground_truth": 0}, {"key": "24632722", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786126497178, "ground_truth": 0}, {"key": "36002759", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6352224291445461, "ground_truth": 0}, {"key": "36002759", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5292634104776743, "ground_truth": 0}, {"key": "36002759", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6224593344531312, "ground_truth": 0}, {"key": "36002759", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.46101679954283464, "ground_truth": 0}, {"key": "36002759", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.598312199224359, "ground_truth": 0}, {"key": "29508534", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8006920060575119, "ground_truth": 0}, {"key": "29508534", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6315943064824288, "ground_truth": 0}, {"key": "29508534", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7185944015350598, "ground_truth": 0}, {"key": "29508534", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228265235055, "ground_truth": 0}, {"key": "29508534", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689485132409, "ground_truth": 0}, {"key": "15631612", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8848377795537374, "ground_truth": 0}, {"key": "15631612", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5214711680737782, "ground_truth": 0}, {"key": "15631612", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.874077235847728, "ground_truth": 0}, {"key": "15631612", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233284066747393, "ground_truth": 0}, {"key": "15631612", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354943888242, "ground_truth": 0}, {"key": "40731892", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.13753246790909082, "ground_truth": 0}, {"key": "40731892", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.22405544957475884, "ground_truth": 0}, {"key": "40731892", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4016877825630927, "ground_truth": 0}, {"key": "40731892", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310404304665, "ground_truth": 0}, {"key": "40731892", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897525603769, "ground_truth": 0}, {"key": "35971910", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.787931193655659, "ground_truth": 0}, {"key": "35971910", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.888758791886661, "ground_truth": 0}, {"key": "35971910", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9073122174602003, "ground_truth": 0}, {"key": "35971910", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9086178981855229, "ground_truth": 0}, {"key": "35971910", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324904428606, "ground_truth": 0}, {"key": "34428424", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9740426419289883, "ground_truth": 0}, {"key": "34428424", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9511422222267588, "ground_truth": 0}, {"key": "34428424", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9773707967652955, "ground_truth": 0}, {"key": "34428424", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9690910400682495, "ground_truth": 0}, {"key": "34428424", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9843363505884031, "ground_truth": 0}, {"key": "36971005", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9462003537876489, "ground_truth": 0}, {"key": "36971005", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9572778040124555, "ground_truth": 0}, {"key": "36971005", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9515039983404074, "ground_truth": 0}, {"key": "36971005", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110421502481, "ground_truth": 0}, {"key": "36971005", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9511422242919247, "ground_truth": 0}, {"key": "34649067", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.18832399225714883, "ground_truth": 0}, {"key": "34649067", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2200070910978149, "ground_truth": 0}, {"key": "34649067", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.17895589069623474, "ground_truth": 0}, {"key": "34649067", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2628418580334565, "ground_truth": 0}, {"key": "34649067", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2974699380029093, "ground_truth": 0}, {"key": "37355154", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.09138210243312755, "ground_truth": 0}, {"key": "37355154", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.42632159337849046, "ground_truth": 0}, {"key": "37355154", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.19436781192217398, "ground_truth": 0}, {"key": "37355154", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.11124121572878819, "ground_truth": 0}, {"key": "37355154", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.0933468750334287, "ground_truth": 0}, {"key": "38674697", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5964331278200522, "ground_truth": 0}, {"key": "38674697", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3522017906653639, "ground_truth": 0}, {"key": "38674697", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6352224290885901, "ground_truth": 0}, {"key": "38674697", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269999909063, "ground_truth": 0}, {"key": "38674697", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786333369734, "ground_truth": 0}, {"key": "40525767", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9838471643569696, "ground_truth": 0}, {"key": "40525767", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9950563108685584, "ground_truth": 0}, {"key": "40525767", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9899086852678526, "ground_truth": 0}, {"key": "40525767", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9872772919245135, "ground_truth": 0}, {"key": "40525767", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9832145086300821, "ground_truth": 0}, {"key": "27165110", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.19072402284980694, "ground_truth": 0}, {"key": "27165110", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.445529528581181, "ground_truth": 0}, {"key": "27165110", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.08210662862631515, "ground_truth": 0}, {"key": "27165110", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2909808758400421, "ground_truth": 0}, {"key": "27165110", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.1666754049041728, "ground_truth": 0}, {"key": "35497491", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6774740242702381, "ground_truth": 0}, {"key": "35497491", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5717666101407987, "ground_truth": 0}, {"key": "35497491", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.756357569675081, "ground_truth": 0}, {"key": "35497491", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299933922895, "ground_truth": 0}, {"key": "35497491", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253685864538, "ground_truth": 0}, {"key": "40690716", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7918210763257475, "ground_truth": 0}, {"key": "40690716", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8749346149114158, "ground_truth": 0}, {"key": "40690716", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8679338359425287, "ground_truth": 0}, {"key": "40690716", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933718317206, "ground_truth": 0}, {"key": "40690716", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104537216616, "ground_truth": 0}, {"key": "34835193", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9656413119909923, "ground_truth": 0}, {"key": "34835193", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9850429138641359, "ground_truth": 0}, {"key": "34835193", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9695556528065672, "ground_truth": 0}, {"key": "34835193", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9817357202132485, "ground_truth": 0}, {"key": "34835193", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9857180666272827, "ground_truth": 0}, {"key": "39471712", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5234203292274558, "ground_truth": 0}, {"key": "39471712", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7233094557707136, "ground_truth": 0}, {"key": "39471712", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4902356079456775, "ground_truth": 0}, {"key": "39471712", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512053099016, "ground_truth": 0}, {"key": "39471712", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593378012168, "ground_truth": 0}, {"key": "39115192", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8740772407728957, "ground_truth": 0}, {"key": "39115192", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7520125471470436, "ground_truth": 0}, {"key": "39115192", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.854884643328921, "ground_truth": 0}, {"key": "39115192", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082728865103, "ground_truth": 0}, {"key": "39115192", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919999504304, "ground_truth": 0}, {"key": "23520673", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.22000709343461602, "ground_truth": 0}, {"key": "23520673", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.25982563118533614, "ground_truth": 0}, {"key": "23520673", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.32252597476879097, "ground_truth": 0}, {"key": "23520673", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552953715107496, "ground_truth": 0}, {"key": "23520673", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2146914354846585, "ground_truth": 0}, {"key": "35764233", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6020615804379517, "ground_truth": 0}, {"key": "35764233", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.45907614412761955, "ground_truth": 0}, {"key": "35764233", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5370413619385019, "ground_truth": 0}, {"key": "35764233", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4902355856723167, "ground_truth": 0}, {"key": "35764233", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "35228910", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.22953520631454163, "ground_truth": 0}, {"key": "35228910", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.30735801747457087, "ground_truth": 0}, {"key": "35228910", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4902356186828472, "ground_truth": 0}, {"key": "35228910", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.47463116890166746, "ground_truth": 0}, {"key": "35228910", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.1581743618943946, "ground_truth": 0}, {"key": "36795599", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9019206740201405, "ground_truth": 0}, {"key": "36795599", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8791467618514193, "ground_truth": 0}, {"key": "36795599", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.865224089054239, "ground_truth": 0}, {"key": "36795599", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9394706126323278, "ground_truth": 0}, {"key": "36795599", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213731820344, "ground_truth": 0}, {"key": "38641949", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.834406897196258, "ground_truth": 0}, {"key": "38641949", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.808067200880486, "ground_truth": 0}, {"key": "38641949", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7634837840328036, "ground_truth": 0}, {"key": "38641949", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892337048076341, "ground_truth": 0}, {"key": "38641949", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624716534566, "ground_truth": 0}, {"key": "29968443", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8757870021403367, "ground_truth": 0}, {"key": "29968443", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.847967754760497, "ground_truth": 0}, {"key": "29968443", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9635062341950048, "ground_truth": 0}, {"key": "29968443", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149036501488, "ground_truth": 0}, {"key": "29968443", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8895288490913212, "ground_truth": 0}, {"key": "21268042", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7356416430038597, "ground_truth": 0}, {"key": "21268042", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8255897276816763, "ground_truth": 0}, {"key": "21268042", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7786493040279375, "ground_truth": 0}, {"key": "21268042", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338420597366, "ground_truth": 0}, {"key": "21268042", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585863191628, "ground_truth": 0}, {"key": "26808572", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5755880246684101, "ground_truth": 0}, {"key": "26808572", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5945512744349012, "ground_truth": 0}, {"key": "26808572", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5964331470571678, "ground_truth": 0}, {"key": "26808572", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526355981227, "ground_truth": 0}, {"key": "26808572", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760149454515, "ground_truth": 0}, {"key": "37829390", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8624675295616374, "ground_truth": 0}, {"key": "37829390", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7981867799916205, "ground_truth": 0}, {"key": "37829390", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7879312015426067, "ground_truth": 0}, {"key": "37829390", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545555017464, "ground_truth": 0}, {"key": "37829390", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545607032632, "ground_truth": 0}, {"key": "35716045", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8933093975042371, "ground_truth": 0}, {"key": "35716045", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8783142515513053, "ground_truth": 0}, {"key": "35716045", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9441768611925101, "ground_truth": 0}, {"key": "35716045", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677361703563, "ground_truth": 0}, {"key": "35716045", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213788728349, "ground_truth": 0}, {"key": "34367070", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8947894582499181, "ground_truth": 0}, {"key": "34367070", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8991213813445692, "ground_truth": 0}, {"key": "34367070", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9118099522849157, "ground_truth": 0}, {"key": "34367070", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9273632937947456, "ground_truth": 0}, {"key": "34367070", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9230391657281323, "ground_truth": 0}, {"key": "35239748", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8116760202102754, "ground_truth": 0}, {"key": "35239748", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.713830767716867, "ground_truth": 0}, {"key": "35239748", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6992544063241934, "ground_truth": 0}, {"key": "35239748", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026777135957, "ground_truth": 0}, {"key": "35239748", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104583478272, "ground_truth": 0}, {"key": "40421370", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6039318389892134, "ground_truth": 0}, {"key": "40421370", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.588889131520953, "ground_truth": 0}, {"key": "40421370", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6242935550072927, "ground_truth": 0}, {"key": "40421370", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432012000945, "ground_truth": 0}, {"key": "40421370", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360044803715715, "ground_truth": 0}, {"key": "37288396", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8300437722081494, "ground_truth": 0}, {"key": "37288396", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.627951207281389, "ground_truth": 0}, {"key": "37288396", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7648916029452753, "ground_truth": 0}, {"key": "37288396", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689417253537, "ground_truth": 0}, {"key": "37288396", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281556223497, "ground_truth": 0}, {"key": "38903688", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.927887789092274, "ground_truth": 0}, {"key": "38903688", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9492946308487181, "ground_truth": 0}, {"key": "38903688", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9252299532845872, "ground_truth": 0}, {"key": "38903688", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9394706018621898, "ground_truth": 0}, {"key": "38903688", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.831143056711489, "ground_truth": 0}, {"key": "28071228", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8766343867363291, "ground_truth": 0}, {"key": "28071228", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9032942141846911, "ground_truth": 0}, {"key": "28071228", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9329437128284083, "ground_truth": 0}, {"key": "28071228", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9142907205502137, "ground_truth": 0}, {"key": "28071228", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099498646016, "ground_truth": 0}, {"key": "36855834", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5467381719087056, "ground_truth": 0}, {"key": "36855834", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5525397056028647, "ground_truth": 0}, {"key": "36855834", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4130035723527961, "ground_truth": 0}, {"key": "36855834", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203557670973, "ground_truth": 0}, {"key": "36855834", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632817286981, "ground_truth": 0}, {"key": "40548717", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3575675174299327, "ground_truth": 0}, {"key": "40548717", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.30404168174954405, "ground_truth": 0}, {"key": "40548717", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5097644243580699, "ground_truth": 0}, {"key": "40548717", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3311197114245262, "ground_truth": 0}, {"key": "40548717", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.345105282523498, "ground_truth": 0}, {"key": "37051175", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7371581473665935, "ground_truth": 0}, {"key": "37051175", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5544704833963774, "ground_truth": 0}, {"key": "37051175", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6242935269900185, "ground_truth": 0}, {"key": "37051175", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197756323218, "ground_truth": 0}, {"key": "37051175", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737905786688, "ground_truth": 0}, {"key": "38882119", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.872347367804543, "ground_truth": 0}, {"key": "38882119", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7248702867855016, "ground_truth": 0}, {"key": "38882119", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7879312155727757, "ground_truth": 0}, {"key": "38882119", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894762332989, "ground_truth": 0}, {"key": "38882119", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918247957744, "ground_truth": 0}, {"key": "19485402", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8044059166067916, "ground_truth": 0}, {"key": "19485402", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6706082850585487, "ground_truth": 0}, {"key": "19485402", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7592253997275252, "ground_truth": 0}, {"key": "19485402", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527491711596, "ground_truth": 0}, {"key": "19485402", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884718202006, "ground_truth": 0}, {"key": "36060907", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.602061582794641, "ground_truth": 0}, {"key": "36060907", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6531269180536479, "ground_truth": 0}, {"key": "36060907", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.803173790146843, "ground_truth": 0}, {"key": "36060907", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754311784803, "ground_truth": 0}, {"key": "36060907", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799929098470997, "ground_truth": 0}, {"key": "24037309", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7041601568825521, "ground_truth": 0}, {"key": "24037309", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8568122949967737, "ground_truth": 0}, {"key": "24037309", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9032942113222174, "ground_truth": 0}, {"key": "24037309", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737320489482, "ground_truth": 0}, {"key": "24037309", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704648012596202, "ground_truth": 0}, {"key": "35605805", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6619228712155064, "ground_truth": 0}, {"key": "35605805", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8354835283173806, "ground_truth": 0}, {"key": "35605805", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6943026714940342, "ground_truth": 0}, {"key": "35605805", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947187941192, "ground_truth": 0}, {"key": "35605805", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366520752349, "ground_truth": 0}, {"key": "17706248", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4092207691279821, "ground_truth": 0}, {"key": "17706248", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3647775498698408, "ground_truth": 0}, {"key": "17706248", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.23091975341442697, "ground_truth": 0}, {"key": "17706248", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.41300358606614346, "ground_truth": 0}, {"key": "17706248", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4186969046201943, "ground_truth": 0}, {"key": "36883559", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7620701102286775, "ground_truth": 0}, {"key": "36883559", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7041601616271408, "ground_truth": 0}, {"key": "36883559", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.689305657042868, "ground_truth": 0}, {"key": "36883559", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947232934211, "ground_truth": 0}, {"key": "36883559", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544147736319, "ground_truth": 0}, {"key": "32799471", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9032942115486552, "ground_truth": 0}, {"key": "32799471", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8615382075520261, "ground_truth": 0}, {"key": "32799471", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8879840675534948, "ground_truth": 0}, {"key": "32799471", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737853063802, "ground_truth": 0}, {"key": "32799471", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933435884748, "ground_truth": 0}, {"key": "34797243", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.35220180119617506, "ground_truth": 0}, {"key": "34797243", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6224593576621751, "ground_truth": 0}, {"key": "34797243", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5794004039749759, "ground_truth": 0}, {"key": "34797243", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3849121724603965, "ground_truth": 0}, {"key": "34797243", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4167966239484445, "ground_truth": 0}, {"key": "32154876", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.38491216229533903, "ground_truth": 0}, {"key": "32154876", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.43782350241422613, "ground_truth": 0}, {"key": "32154876", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.44746029197077514, "ground_truth": 0}, {"key": "32154876", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3140505597446587, "ground_truth": 0}, {"key": "32154876", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076629735826108, "ground_truth": 0}, {"key": "37962274", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7279754529315123, "ground_truth": 0}, {"key": "37962274", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5448013901803627, "ground_truth": 0}, {"key": "37962274", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5312093882480953, "ground_truth": 0}, {"key": "37962274", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802280762606, "ground_truth": 0}, {"key": "37962274", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762771077396, "ground_truth": 0}, {"key": "35574030", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4571367302101404, "ground_truth": 0}, {"key": "35574030", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6297746067407115, "ground_truth": 0}, {"key": "35574030", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7401743515668472, "ground_truth": 0}, {"key": "35574030", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544468973042, "ground_truth": 0}, {"key": "35574030", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.537041379263165, "ground_truth": 0}, {"key": "39105949", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7154239841084502, "ground_truth": 0}, {"key": "39105949", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7772998614482491, "ground_truth": 0}, {"key": "39105949", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7826624853402498, "ground_truth": 0}, {"key": "39105949", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681041099733, "ground_truth": 0}, {"key": "39105949", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104539863545, "ground_truth": 0}, {"key": "41064322", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9529258255291229, "ground_truth": 0}, {"key": "41064322", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9489172688408521, "ground_truth": 0}, {"key": "41064322", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9805806511537816, "ground_truth": 0}, {"key": "41064322", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9790357607470567, "ground_truth": 0}, {"key": "41064322", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9700134938063532, "ground_truth": 0}, {"key": "28105101", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8529354691097247, "ground_truth": 0}, {"key": "28105101", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7325918393416325, "ground_truth": 0}, {"key": "28105101", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8606036139714672, "ground_truth": 0}, {"key": "28105101", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.774583384461947, "ground_truth": 0}, {"key": "28105101", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736784041954492, "ground_truth": 0}, {"key": "36036068", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6095241371661804, "ground_truth": 0}, {"key": "36036068", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6926419679118668, "ground_truth": 0}, {"key": "36036068", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8233283975034692, "ground_truth": 0}, {"key": "36036068", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577680961677854, "ground_truth": 0}, {"key": "36036068", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578334619775, "ground_truth": 0}, {"key": "37991460", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.513668439246349, "ground_truth": 0}, {"key": "37991460", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7943849571215202, "ground_truth": 0}, {"key": "37991460", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.418696923106144, "ground_truth": 0}, {"key": "37991460", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898526550575, "ground_truth": 0}, {"key": "37991460", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504837681972, "ground_truth": 0}, {"key": "38437830", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6095241618055659, "ground_truth": 0}, {"key": "38437830", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6688802518486386, "ground_truth": 0}, {"key": "38437830", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.873214834199203, "ground_truth": 0}, {"key": "38437830", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897189185588, "ground_truth": 0}, {"key": "38437830", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210843876797, "ground_truth": 0}, {"key": "36507138", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7122321966620517, "ground_truth": 0}, {"key": "36507138", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.44939261887121296, "ground_truth": 0}, {"key": "36507138", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6039318449649489, "ground_truth": 0}, {"key": "36507138", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011557131278, "ground_truth": 0}, {"key": "36507138", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239966432949, "ground_truth": 0}, {"key": "37824866", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7341195312333362, "ground_truth": 0}, {"key": "37824866", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9105453982823271, "ground_truth": 0}, {"key": "37824866", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8044059019331082, "ground_truth": 0}, {"key": "37824866", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578386249159, "ground_truth": 0}, {"key": "37824866", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.640635830845014, "ground_truth": 0}, {"key": "25088134", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.720171500242792, "ground_truth": 0}, {"key": "25088134", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.718594384798659, "ground_truth": 0}, {"key": "25088134", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6057990182335697, "ground_truth": 0}, {"key": "25088134", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804415946452, "ground_truth": 0}, {"key": "25088134", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982221589155, "ground_truth": 0}, {"key": "40172531", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8175744919212373, "ground_truth": 0}, {"key": "40172531", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8289388108434139, "ground_truth": 0}, {"key": "40172531", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8210441296679378, "ground_truth": 0}, {"key": "40172531", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677547775194, "ground_truth": 0}, {"key": "40172531", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311877253573, "ground_truth": 0}, {"key": "37035874", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46101676667323604, "ground_truth": 0}, {"key": "37035874", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5486734906072894, "ground_truth": 0}, {"key": "37035874", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.32423540804218015, "ground_truth": 0}, {"key": "37035874", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4687906296524508, "ground_truth": 0}, {"key": "37035874", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.31405056494919653, "ground_truth": 0}, {"key": "36404465", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.974821157398271, "ground_truth": 0}, {"key": "36404465", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9858276342164495, "ground_truth": 0}, {"key": "36404465", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9603611608353764, "ground_truth": 0}, {"key": "36404465", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9704646623423001, "ground_truth": 0}, {"key": "36404465", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9623913637254562, "ground_truth": 0}, {"key": "39602052", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8031738017903797, "ground_truth": 0}, {"key": "39602052", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9032942137896732, "ground_truth": 0}, {"key": "39602052", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9477691414163033, "ground_truth": 0}, {"key": "39602052", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142395257922, "ground_truth": 0}, {"key": "39602052", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9202179856436435, "ground_truth": 0}, {"key": "33792789", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.42441199995211376, "ground_truth": 0}, {"key": "33792789", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6424324595718118, "ground_truth": 0}, {"key": "33792789", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6352224199719738, "ground_truth": 0}, {"key": "33792789", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.812867312505914, "ground_truth": 0}, {"key": "33792789", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256044482528, "ground_truth": 0}, {"key": "32776626", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.638835286016992, "ground_truth": 0}, {"key": "32776626", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.62977459237902, "ground_truth": 0}, {"key": "32776626", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3979384300632548, "ground_truth": 0}, {"key": "32776626", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413964983934, "ground_truth": 0}, {"key": "32776626", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4532618677570009, "ground_truth": 0}, {"key": "37195090", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4843800626661342, "ground_truth": 0}, {"key": "37195090", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6187804266317404, "ground_truth": 0}, {"key": "37195090", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.48438010894194716, "ground_truth": 0}, {"key": "37195090", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352925296187, "ground_truth": 0}, {"key": "37195090", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165313143707, "ground_truth": 0}, {"key": "33981824", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2735743975264877, "ground_truth": 0}, {"key": "33981824", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.26284185470591465, "ground_truth": 0}, {"key": "33981824", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3867634427982102, "ground_truth": 0}, {"key": "33981824", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3242353937660444, "ground_truth": 0}, {"key": "33981824", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2323101564994243, "ground_truth": 0}, {"key": "39569142", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5813031026849532, "ground_truth": 0}, {"key": "39569142", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.533154405944699, "ground_truth": 0}, {"key": "39569142", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5525396930886312, "ground_truth": 0}, {"key": "39569142", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102690150784, "ground_truth": 0}, {"key": "39569142", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282333813319317, "ground_truth": 0}, {"key": "40268210", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7676898540687533, "ground_truth": 0}, {"key": "40268210", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7264256208092515, "ground_truth": 0}, {"key": "40268210", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8661325078362196, "ground_truth": 0}, {"key": "40268210", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9522199317716616, "ground_truth": 0}, {"key": "40268210", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711827941472, "ground_truth": 0}, {"key": "34925159", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7745833763659232, "ground_truth": 0}, {"key": "34925159", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8128673104523731, "ground_truth": 0}, {"key": "34925159", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8376199708871106, "ground_truth": 0}, {"key": "34925159", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872045905696405, "ground_truth": 0}, {"key": "34925159", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9376689623973355, "ground_truth": 0}, {"key": "36181903", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9362850098495413, "ground_truth": 0}, {"key": "36181903", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9362850016061574, "ground_truth": 0}, {"key": "36181903", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9579122702899567, "ground_truth": 0}, {"key": "36181903", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9532750445141231, "ground_truth": 0}, {"key": "36181903", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9394706168702368, "ground_truth": 0}, {"key": "38620559", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8104789081340454, "ground_truth": 0}, {"key": "38620559", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9219218409539603, "ground_truth": 0}, {"key": "38620559", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8848377704963823, "ground_truth": 0}, {"key": "38620559", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9196425320853994, "ground_truth": 0}, {"key": "38620559", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.931959586181166, "ground_truth": 0}, {"key": "32719657", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6039318392011873, "ground_truth": 0}, {"key": "32719657", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8910549568339452, "ground_truth": 0}, {"key": "32719657", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6442250692873545, "ground_truth": 0}, {"key": "32719657", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883474079349, "ground_truth": 0}, {"key": "32719657", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.45907612727851743, "ground_truth": 0}, {"key": "37530914", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.40733340454132655, "ground_truth": 0}, {"key": "37530914", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5370413864631378, "ground_truth": 0}, {"key": "37530914", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.43206339547238204, "ground_truth": 0}, {"key": "37530914", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358123316818, "ground_truth": 0}, {"key": "37530914", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "33306933", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9079671426969597, "ground_truth": 0}, {"key": "33306933", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9190632874006522, "ground_truth": 0}, {"key": "33306933", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9585377255505034, "ground_truth": 0}, {"key": "33306933", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361658116104, "ground_truth": 0}, {"key": "33306933", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346221360469, "ground_truth": 0}, {"key": "33837212", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7264256067991576, "ground_truth": 0}, {"key": "33837212", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5078118311304513, "ground_truth": 0}, {"key": "33837212", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7620701044383362, "ground_truth": 0}, {"key": "33837212", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.812867306082388, "ground_truth": 0}, {"key": "33837212", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121738063323, "ground_truth": 0}, {"key": "40945179", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7416740196734148, "ground_truth": 0}, {"key": "40945179", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7295197778669605, "ground_truth": 0}, {"key": "40945179", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7476159508456371, "ground_truth": 0}, {"key": "40945179", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624941545518, "ground_truth": 0}, {"key": "40945179", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867588879419, "ground_truth": 0}, {"key": "34152358", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2845760127593516, "ground_truth": 0}, {"key": "34152358", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7201715231997355, "ground_truth": 0}, {"key": "34152358", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5907792002403044, "ground_truth": 0}, {"key": "34152358", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740258793596, "ground_truth": 0}, {"key": "34152358", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436003867152202, "ground_truth": 0}, {"key": "34136541", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8848377722206814, "ground_truth": 0}, {"key": "34136541", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8210441142594553, "ground_truth": 0}, {"key": "34136541", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7520125969030245, "ground_truth": 0}, {"key": "34136541", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256558145247, "ground_truth": 0}, {"key": "34136541", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059557592975, "ground_truth": 0}, {"key": "37469603", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6279511957457509, "ground_truth": 0}, {"key": "37469603", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7461389781223459, "ground_truth": 0}, {"key": "37469603", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7563575604523315, "ground_truth": 0}, {"key": "37469603", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269914093166, "ground_truth": 0}, {"key": "37469603", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059295852483, "ground_truth": 0}, {"key": "37353611", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9623913603915837, "ground_truth": 0}, {"key": "37353611", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9278878007559643, "ground_truth": 0}, {"key": "37353611", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8872045888207769, "ground_truth": 0}, {"key": "37353611", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9184802455950337, "ground_truth": 0}, {"key": "37353611", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9329437153647013, "ground_truth": 0}, {"key": "37211649", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5755880170269307, "ground_truth": 0}, {"key": "37211649", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7892336977982054, "ground_truth": 0}, {"key": "37211649", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7981867856054922, "ground_truth": 0}, {"key": "37211649", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494522865364, "ground_truth": 0}, {"key": "37211649", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.39606820101058626, "ground_truth": 0}, {"key": "37320976", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8386797631409252, "ground_truth": 0}, {"key": "37320976", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7490872259378512, "ground_truth": 0}, {"key": "37320976", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8558511447029876, "ground_truth": 0}, {"key": "37320976", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942292633849, "ground_truth": 0}, {"key": "37320976", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528213418018, "ground_truth": 0}, {"key": "34492412", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9469902298555262, "ground_truth": 0}, {"key": "34492412", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8104789227664643, "ground_truth": 0}, {"key": "34492412", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9753900704690736, "ground_truth": 0}, {"key": "34492412", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675326092417, "ground_truth": 0}, {"key": "34492412", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9500414756327, "ground_truth": 0}, {"key": "36655016", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9600626855162856, "ground_truth": 0}, {"key": "36655016", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9453993935396401, "ground_truth": 0}, {"key": "36655016", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9621075746939726, "ground_truth": 0}, {"key": "36655016", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9664104952298714, "ground_truth": 0}, {"key": "36655016", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9615338077395789, "ground_truth": 0}, {"key": "35220773", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8092759692404409, "ground_truth": 0}, {"key": "35220773", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.445529496806553, "ground_truth": 0}, {"key": "35220773", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8152324945473881, "ground_truth": 0}, {"key": "35220773", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918393141876, "ground_truth": 0}, {"key": "35220773", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493148811731, "ground_truth": 0}, {"key": "31569808", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5888891367454879, "ground_truth": 0}, {"key": "31569808", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3293917131674871, "ground_truth": 0}, {"key": "31569808", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5945512915145207, "ground_truth": 0}, {"key": "31569808", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918408375807, "ground_truth": 0}, {"key": "31569808", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197803052069, "ground_truth": 0}, {"key": "37696256", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.49023563893541916, "ground_truth": 0}, {"key": "37696256", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.613236523690287, "ground_truth": 0}, {"key": "37696256", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.48633154868890754, "ground_truth": 0}, {"key": "37696256", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203548686505, "ground_truth": 0}, {"key": "37696256", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102359743968, "ground_truth": 0}, {"key": "36874328", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7732163801403673, "ground_truth": 0}, {"key": "36874328", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8006919962959417, "ground_truth": 0}, {"key": "36874328", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8969755756516191, "ground_truth": 0}, {"key": "36874328", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823461163766, "ground_truth": 0}, {"key": "36874328", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148427452883, "ground_truth": 0}, {"key": "24532377", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.30239107648241476, "ground_truth": 0}, {"key": "24532377", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.268941427273096, "ground_truth": 0}, {"key": "24532377", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3293917179328761, "ground_truth": 0}, {"key": "24532377", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.29746994021089807, "ground_truth": 0}, {"key": "24532377", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2613309364970514, "ground_truth": 0}, {"key": "39560618", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7759445638290446, "ground_truth": 0}, {"key": "39560618", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6619228515874932, "ground_truth": 0}, {"key": "39560618", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6992544087415183, "ground_truth": 0}, {"key": "39560618", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085852595596, "ground_truth": 0}, {"key": "39560618", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.667147708797633, "ground_truth": 0}, {"key": "34922693", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.24220563893726865, "ground_truth": 0}, {"key": "34922693", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.18952109971605868, "ground_truth": 0}, {"key": "34922693", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.1766716043638558, "ground_truth": 0}, {"key": "34922693", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405545854371342, "ground_truth": 0}, {"key": "34922693", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2465333357649114, "ground_truth": 0}, {"key": "33629577", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5679365847535328, "ground_truth": 0}, {"key": "33629577", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6876299810901966, "ground_truth": 0}, {"key": "33629577", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6774739955574416, "ground_truth": 0}, {"key": "33629577", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386691046274155, "ground_truth": 0}, {"key": "33629577", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165404320524, "ground_truth": 0}, {"key": "32284359", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.694302669949875, "ground_truth": 0}, {"key": "32284359", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.538983209071903, "ground_truth": 0}, {"key": "32284359", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.45907613473906284, "ground_truth": 0}, {"key": "32284359", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026875840523, "ground_truth": 0}, {"key": "32284359", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918484197608, "ground_truth": 0}, {"key": "28082962", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6132365511247851, "ground_truth": 0}, {"key": "28082962", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.32082128978119323, "ground_truth": 0}, {"key": "28082962", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5774953448201168, "ground_truth": 0}, {"key": "28082962", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324878497526, "ground_truth": 0}, {"key": "28082962", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786051983311, "ground_truth": 0}, {"key": "24796803", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7662936513955895, "ground_truth": 0}, {"key": "24796803", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8233283969482141, "ground_truth": 0}, {"key": "24796803", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8221891238108284, "ground_truth": 0}, {"key": "24796803", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.851952805531735, "ground_truth": 0}, {"key": "24796803", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849619580389, "ground_truth": 0}, {"key": "35466150", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.752012560967613, "ground_truth": 0}, {"key": "35466150", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6909762905782618, "ground_truth": 0}, {"key": "35466150", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8198933397742894, "ground_truth": 0}, {"key": "35466150", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233284089804328, "ground_truth": 0}, {"key": "35466150", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615566365272, "ground_truth": 0}, {"key": "35754289", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.927887797222848, "ground_truth": 0}, {"key": "35754289", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8832359908341835, "ground_truth": 0}, {"key": "35754289", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.928408805773231, "ground_truth": 0}, {"key": "35754289", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267118081742397, "ground_truth": 0}, {"key": "35754289", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840520244011, "ground_truth": 0}, {"key": "36678662", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9553191300544089, "ground_truth": 0}, {"key": "36678662", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9609517065839523, "ground_truth": 0}, {"key": "36678662", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9263037266415092, "ground_truth": 0}, {"key": "36678662", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849599205913, "ground_truth": 0}, {"key": "36678662", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748752089767, "ground_truth": 0}, {"key": "35399671", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9429286051413629, "ground_truth": 0}, {"key": "35399671", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8187367750419472, "ground_truth": 0}, {"key": "35399671", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9005297947326923, "ground_truth": 0}, {"key": "35399671", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9481545324615913, "ground_truth": 0}, {"key": "35399671", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907190835026, "ground_truth": 0}, {"key": "36888180", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7476159568827506, "ground_truth": 0}, {"key": "36888180", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6909762934287637, "ground_truth": 0}, {"key": "36888180", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7732163732423176, "ground_truth": 0}, {"key": "36888180", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918363494697, "ground_truth": 0}, {"key": "36888180", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737373901817, "ground_truth": 0}, {"key": "28061069", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5389832157717324, "ground_truth": 0}, {"key": "28061069", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5389832320265471, "ground_truth": 0}, {"key": "28061069", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5039061877437259, "ground_truth": 0}, {"key": "28061069", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486735116858159, "ground_truth": 0}, {"key": "28061069", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641285845169, "ground_truth": 0}, {"key": "22259982", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5136684698441509, "ground_truth": 0}, {"key": "22259982", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4092208047535121, "ground_truth": 0}, {"key": "22259982", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5602526587789142, "ground_truth": 0}, {"key": "22259982", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4092207784856521, "ground_truth": 0}, {"key": "22259982", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569731190078875, "ground_truth": 0}, {"key": "34026805", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8449215320017801, "ground_truth": 0}, {"key": "34026805", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9111797101962475, "ground_truth": 0}, {"key": "34026805", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7732163719414225, "ground_truth": 0}, {"key": "34026805", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159418892053, "ground_truth": 0}, {"key": "34026805", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.874077232971317, "ground_truth": 0}, {"key": "36713809", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.839733962375714, "ground_truth": 0}, {"key": "36713809", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9329437142334525, "ground_truth": 0}, {"key": "36713809", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9118099529973487, "ground_truth": 0}, {"key": "36713809", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755774186317, "ground_truth": 0}, {"key": "36713809", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9268352807170339, "ground_truth": 0}, {"key": "39726411", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5660185345545794, "ground_truth": 0}, {"key": "39726411", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3775406628873103, "ground_truth": 0}, {"key": "39726411", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4244120013473514, "ground_truth": 0}, {"key": "39726411", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.34158249393000834, "ground_truth": 0}, {"key": "39726411", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.41869690599107673, "ground_truth": 0}, {"key": "37069841", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7248702695655387, "ground_truth": 0}, {"key": "37069841", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.87663438848956, "ground_truth": 0}, {"key": "37069841", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7505527705741152, "ground_truth": 0}, {"key": "37069841", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689793697954, "ground_truth": 0}, {"key": "37069841", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647107856635, "ground_truth": 0}, {"key": "38894693", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5389832079760439, "ground_truth": 0}, {"key": "38894693", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.529263365974354, "ground_truth": 0}, {"key": "38894693", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5602526354232823, "ground_truth": 0}, {"key": "38894693", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737347463203, "ground_truth": 0}, {"key": "38894693", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106282897280211, "ground_truth": 0}, {"key": "33946032", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.97557691034526, "ground_truth": 0}, {"key": "33946032", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9846936456621039, "ground_truth": 0}, {"key": "33946032", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9676556693958758, "ground_truth": 0}, {"key": "33946032", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9149009479491925, "ground_truth": 0}, {"key": "33946032", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9569571498779305, "ground_truth": 0}, {"key": "39035311", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8991213805488147, "ground_truth": 0}, {"key": "39035311", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9026096018906241, "ground_truth": 0}, {"key": "39035311", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.894051720001609, "ground_truth": 0}, {"key": "39035311", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430462838474, "ground_truth": 0}, {"key": "39035311", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059667176756, "ground_truth": 0}, {"key": "27680038", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3225260019397452, "ground_truth": 0}, {"key": "27680038", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.635222452734788, "ground_truth": 0}, {"key": "27680038", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5679366185699823, "ground_truth": 0}, {"key": "27680038", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.585101163969914, "ground_truth": 0}, {"key": "27680038", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922081310996294, "ground_truth": 0}, {"key": "36901907", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6242935328356489, "ground_truth": 0}, {"key": "36901907", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6926419907118597, "ground_truth": 0}, {"key": "36901907", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8056321840300394, "ground_truth": 0}, {"key": "36901907", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581752971997, "ground_truth": 0}, {"key": "36901907", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786344934007, "ground_truth": 0}, {"key": "21530542", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6477982312157612, "ground_truth": 0}, {"key": "21530542", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7090191595174102, "ground_truth": 0}, {"key": "21530542", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6654105707849789, "ground_truth": 0}, {"key": "21530542", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097644070639069, "ground_truth": 0}, {"key": "21530542", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893055895724518, "ground_truth": 0}, {"key": "38192532", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8766343814752989, "ground_truth": 0}, {"key": "38192532", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9241418185405832, "ground_truth": 0}, {"key": "38192532", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8991213840788662, "ground_truth": 0}, {"key": "38192532", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204150985817, "ground_truth": 0}, {"key": "38192532", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358154959919, "ground_truth": 0}, {"key": "34102400", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2958398680531496, "ground_truth": 0}, {"key": "34102400", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.12592276015362014, "ground_truth": 0}, {"key": "34102400", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.22953522161444423, "ground_truth": 0}, {"key": "34102400", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.21469142454790877, "ground_truth": 0}, {"key": "34102400", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.23231013948825008, "ground_truth": 0}, {"key": "36133399", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7154240064009297, "ground_truth": 0}, {"key": "36133399", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.895522676626505, "ground_truth": 0}, {"key": "36133399", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8289388008952094, "ground_truth": 0}, {"key": "36133399", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797559332373, "ground_truth": 0}, {"key": "36133399", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947402939029, "ground_truth": 0}, {"key": "34314544", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.834406893645074, "ground_truth": 0}, {"key": "34314544", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7057850421191832, "ground_truth": 0}, {"key": "34314544", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7233094691141349, "ground_truth": 0}, {"key": "34314544", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.858718575295432, "ground_truth": 0}, {"key": "34314544", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.661922874625993, "ground_truth": 0}, {"key": "33460074", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7563575566882964, "ground_truth": 0}, {"key": "33460074", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8418256555299776, "ground_truth": 0}, {"key": "33460074", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8044059023351299, "ground_truth": 0}, {"key": "33460074", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118784958526, "ground_truth": 0}, {"key": "33460074", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493225921495, "ground_truth": 0}, {"key": "36191495", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5156199211678739, "ground_truth": 0}, {"key": "36191495", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6757645967444577, "ground_truth": 0}, {"key": "36191495", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6224593162713138, "ground_truth": 0}, {"key": "36191495", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307530393544, "ground_truth": 0}, {"key": "36191495", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953520365219, "ground_truth": 0}, {"key": "39532668", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9489172611635969, "ground_truth": 0}, {"key": "39532668", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9202179859467764, "ground_truth": 0}, {"key": "39532668", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7745833718635573, "ground_truth": 0}, {"key": "39532668", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506552876993, "ground_truth": 0}, {"key": "39532668", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424358132298, "ground_truth": 0}, {"key": "20328247", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5312093731255138, "ground_truth": 0}, {"key": "20328247", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.37754066934663816, "ground_truth": 0}, {"key": "20328247", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5234203539143913, "ground_truth": 0}, {"key": "20328247", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633759994759, "ground_truth": 0}, {"key": "20328247", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601724003312506, "ground_truth": 0}, {"key": "39112675", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6057990675769042, "ground_truth": 0}, {"key": "39112675", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6169358389639167, "ground_truth": 0}, {"key": "39112675", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8376199727585351, "ground_truth": 0}, {"key": "39112675", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307504447561, "ground_truth": 0}, {"key": "39112675", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300820846935, "ground_truth": 0}, {"key": "31620300", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7606506482220368, "ground_truth": 0}, {"key": "31620300", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6442251173650411, "ground_truth": 0}, {"key": "31620300", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6808786067303675, "ground_truth": 0}, {"key": "31620300", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740355772912, "ground_truth": 0}, {"key": "31620300", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631812144442, "ground_truth": 0}, {"key": "37518509", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.30735800438249444, "ground_truth": 0}, {"key": "37518509", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3468730847912088, "ground_truth": 0}, {"key": "37518509", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5253688401903973, "ground_truth": 0}, {"key": "37518509", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381441283508, "ground_truth": 0}, {"key": "37518509", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804787106974774, "ground_truth": 0}, {"key": "35454095", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7759445566586879, "ground_truth": 0}, {"key": "35454095", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8998277832461777, "ground_truth": 0}, {"key": "35454095", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7839884675665004, "ground_truth": 0}, {"key": "35454095", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624846198341, "ground_truth": 0}, {"key": "35454095", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493161361376, "ground_truth": 0}, {"key": "38542788", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9623913636784203, "ground_truth": 0}, {"key": "38542788", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9394706133599302, "ground_truth": 0}, {"key": "38542788", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9416541622303086, "ground_truth": 0}, {"key": "38542788", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9563089435066071, "ground_truth": 0}, {"key": "38542788", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9532750464443683, "ground_truth": 0}, {"key": "23944937", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6992544192905834, "ground_truth": 0}, {"key": "23944937", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4016877967609553, "ground_truth": 0}, {"key": "23944937", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7490872133431244, "ground_truth": 0}, {"key": "23944937", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416344277981, "ground_truth": 0}, {"key": "23944937", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307876887179, "ground_truth": 0}, {"key": "31753944", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.44746029046581315, "ground_truth": 0}, {"key": "31753944", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.47852879781358554, "ground_truth": 0}, {"key": "31753944", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4882834083764399, "ground_truth": 0}, {"key": "31753944", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.560252620495346, "ground_truth": 0}, {"key": "31753944", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213019733231, "ground_truth": 0}, {"key": "35527214", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.759225392535485, "ground_truth": 0}, {"key": "35527214", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8697145737161797, "ground_truth": 0}, {"key": "35527214", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7446563231374757, "ground_truth": 0}, {"key": "35527214", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909763114922798, "ground_truth": 0}, {"key": "35527214", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998639045547, "ground_truth": 0}, {"key": "40400404", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9629528317000626, "ground_truth": 0}, {"key": "40400404", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9546474198210597, "ground_truth": 0}, {"key": "40400404", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9623913621167116, "ground_truth": 0}, {"key": "40400404", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9429286023416252, "ground_truth": 0}, {"key": "40400404", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.948917266525758, "ground_truth": 0}, {"key": "21713119", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5039061601372827, "ground_truth": 0}, {"key": "21713119", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5039061635404305, "ground_truth": 0}, {"key": "21713119", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4571367300339024, "ground_truth": 0}, {"key": "21713119", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4863315495814809, "ground_truth": 0}, {"key": "21713119", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3575675089335179, "ground_truth": 0}, {"key": "28730678", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.867933836238841, "ground_truth": 0}, {"key": "28730678", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8311430500112158, "ground_truth": 0}, {"key": "28730678", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8606036235630107, "ground_truth": 0}, {"key": "28730678", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675321464881, "ground_truth": 0}, {"key": "28730678", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122980876425, "ground_truth": 0}, {"key": "36823733", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8044059087836074, "ground_truth": 0}, {"key": "36823733", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6566582456009358, "ground_truth": 0}, {"key": "36823733", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8244619329585459, "ground_truth": 0}, {"key": "36823733", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.747615943091049, "ground_truth": 0}, {"key": "36823733", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624746623381, "ground_truth": 0}, {"key": "35988862", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.41489885329589965, "ground_truth": 0}, {"key": "35988862", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3311197330777645, "ground_truth": 0}, {"key": "35988862", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.49609381298958793, "ground_truth": 0}, {"key": "35988862", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4167966358096377, "ground_truth": 0}, {"key": "35988862", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4244119684036206, "ground_truth": 0}, {"key": "40499665", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9429286007387048, "ground_truth": 0}, {"key": "40499665", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9420819157802064, "ground_truth": 0}, {"key": "40499665", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8749346055949007, "ground_truth": 0}, {"key": "40499665", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9556514213716373, "ground_truth": 0}, {"key": "40499665", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9536217951786522, "ground_truth": 0}, {"key": "32829820", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8354835304970573, "ground_truth": 0}, {"key": "32829820", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.734119542136682, "ground_truth": 0}, {"key": "32829820", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8006919895588112, "ground_truth": 0}, {"key": "32829820", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163597454554, "ground_truth": 0}, {"key": "32829820", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082616462673, "ground_truth": 0}, {"key": "20583553", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.1634454307341428, "ground_truth": 0}, {"key": "20583553", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.19559406713544697, "ground_truth": 0}, {"key": "20583553", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.22405542644697055, "ground_truth": 0}, {"key": "20583553", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2173375317503745, "ground_truth": 0}, {"key": "20583553", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2295351946635006, "ground_truth": 0}, {"key": "30501550", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8848377651596716, "ground_truth": 0}, {"key": "30501550", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8278281496183598, "ground_truth": 0}, {"key": "30501550", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8991213785528369, "ground_truth": 0}, {"key": "30501550", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361529427198, "ground_truth": 0}, {"key": "30501550", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837746035807, "ground_truth": 0}, {"key": "38755897", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6808786032141159, "ground_truth": 0}, {"key": "38755897", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3665897307840009, "ground_truth": 0}, {"key": "38755897", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6893056007518911, "ground_truth": 0}, {"key": "38755897", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.48828339990314495, "ground_truth": 0}, {"key": "38755897", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159577240741, "ground_truth": 0}, {"key": "35507201", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6352224405329128, "ground_truth": 0}, {"key": "35507201", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7476159452808065, "ground_truth": 0}, {"key": "35507201", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7956581001118347, "ground_truth": 0}, {"key": "35507201", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004043456973, "ground_truth": 0}, {"key": "35507201", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804198337847, "ground_truth": 0}, {"key": "36453511", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8955226711532378, "ground_truth": 0}, {"key": "36453511", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9643214492281583, "ground_truth": 0}, {"key": "36453511", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9178933640626363, "ground_truth": 0}, {"key": "36453511", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9334308214241852, "ground_truth": 0}, {"key": "36453511", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9445872106622779, "ground_truth": 0}, {"key": "38066835", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8449215195535591, "ground_truth": 0}, {"key": "38066835", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7905303425777335, "ground_truth": 0}, {"key": "38066835", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8539127469502905, "ground_truth": 0}, {"key": "38066835", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.753466642130909, "ground_truth": 0}, {"key": "38066835", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.87059726824282, "ground_truth": 0}, {"key": "39697181", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6876299717027016, "ground_truth": 0}, {"key": "39697181", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5774953483159142, "ground_truth": 0}, {"key": "39697181", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7185944093486344, "ground_truth": 0}, {"key": "39697181", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299991967533, "ground_truth": 0}, {"key": "39697181", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832133525261, "ground_truth": 0}, {"key": "21820893", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6206216507625625, "ground_truth": 0}, {"key": "21820893", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7233094853936876, "ground_truth": 0}, {"key": "21820893", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7264256080702123, "ground_truth": 0}, {"key": "21820893", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432224281851, "ground_truth": 0}, {"key": "21820893", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872250597562, "ground_truth": 0}, {"key": "40519933", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8092759766648034, "ground_truth": 0}, {"key": "40519933", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5717665749253296, "ground_truth": 0}, {"key": "40519933", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6076631844666146, "ground_truth": 0}, {"key": "40519933", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.672331697517743, "ground_truth": 0}, {"key": "40519933", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743683004535, "ground_truth": 0}, {"key": "30446033", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.845942435541733, "ground_truth": 0}, {"key": "30446033", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.828938811742801, "ground_truth": 0}, {"key": "30446033", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8449215193049743, "ground_truth": 0}, {"key": "30446033", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063799201742, "ground_truth": 0}, {"key": "30446033", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152325018107428, "ground_truth": 0}, {"key": "40216291", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7476159359515252, "ground_truth": 0}, {"key": "40216291", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8596637613087914, "ground_truth": 0}, {"key": "40216291", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9462003538103457, "ground_truth": 0}, {"key": "40216291", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206821632004, "ground_truth": 0}, {"key": "40216291", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206782804358, "ground_truth": 0}, {"key": "33479118", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3611647153960987, "ground_truth": 0}, {"key": "33479118", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.33285231370334717, "ground_truth": 0}, {"key": "33479118", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4225046128622968, "ground_truth": 0}, {"key": "33479118", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3106943792407766, "ground_truth": 0}, {"key": "33479118", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.35220178617724834, "ground_truth": 0}, {"key": "22297373", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.35936414426244756, "ground_truth": 0}, {"key": "22297373", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.1955940850693157, "ground_truth": 0}, {"key": "22297373", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.42059959163941985, "ground_truth": 0}, {"key": "22297373", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.19436781983075094, "ground_truth": 0}, {"key": "22297373", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.18126322667978503, "ground_truth": 0}, {"key": "36463668", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.1470645323070042, "ground_truth": 0}, {"key": "36463668", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.42441199252942113, "ground_truth": 0}, {"key": "36463668", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3174262791107197, "ground_truth": 0}, {"key": "36463668", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.1871326778654812, "ground_truth": 0}, {"key": "36463668", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.28457602193613235, "ground_truth": 0}, {"key": "35264615", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6992544150950726, "ground_truth": 0}, {"key": "35264615", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8187368156046017, "ground_truth": 0}, {"key": "35264615", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.712232194371024, "ground_truth": 0}, {"key": "35264615", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584175117275921, "ground_truth": 0}, {"key": "35264615", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918428976598, "ground_truth": 0}, {"key": "39898482", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9635062336688315, "ground_truth": 0}, {"key": "39898482", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9594592656691581, "ground_truth": 0}, {"key": "39898482", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9618217266659495, "ground_truth": 0}, {"key": "39898482", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9518632294377432, "ground_truth": 0}, {"key": "39898482", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.94292859895044, "ground_truth": 0}, {"key": "37228721", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8479677558774209, "ground_truth": 0}, {"key": "37228721", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8679338320127097, "ground_truth": 0}, {"key": "37228721", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7310585943398759, "ground_truth": 0}, {"key": "37228721", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445480499745, "ground_truth": 0}, {"key": "37228721", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526233700407, "ground_truth": 0}, {"key": "24535799", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8019358394925022, "ground_truth": 0}, {"key": "24535799", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9445872100864312, "ground_truth": 0}, {"key": "24535799", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8947894544397589, "ground_truth": 0}, {"key": "24535799", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338453333301, "ground_truth": 0}, {"key": "24535799", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204172048648, "ground_truth": 0}, {"key": "35177759", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8092759887047283, "ground_truth": 0}, {"key": "35177759", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7732163744988737, "ground_truth": 0}, {"key": "35177759", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8740772352583075, "ground_truth": 0}, {"key": "35177759", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631467189209, "ground_truth": 0}, {"key": "35177759", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894628594442, "ground_truth": 0}, {"key": "34364829", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.685949451181043, "ground_truth": 0}, {"key": "34364829", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7217432043755432, "ground_truth": 0}, {"key": "34364829", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7074047265145411, "ground_truth": 0}, {"key": "34364829", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030761243991, "ground_truth": 0}, {"key": "34364829", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740176138618, "ground_truth": 0}, {"key": "38090732", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8705972593437767, "ground_truth": 0}, {"key": "38090732", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8799743593633734, "ground_truth": 0}, {"key": "38090732", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.684264022644603, "ground_truth": 0}, {"key": "38090732", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511485978813, "ground_truth": 0}, {"key": "38090732", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517139434496, "ground_truth": 0}, {"key": "30651479", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6020615894002774, "ground_truth": 0}, {"key": "30651479", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7931059546220166, "ground_truth": 0}, {"key": "30651479", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8128673138725097, "ground_truth": 0}, {"key": "30651479", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528034512585, "ground_truth": 0}, {"key": "30651479", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381548379493, "ground_truth": 0}, {"key": "39380921", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5428633054091239, "ground_truth": 0}, {"key": "39380921", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40733342739204037, "ground_truth": 0}, {"key": "39380921", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4532618328010581, "ground_truth": 0}, {"key": "39380921", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704756688557, "ground_truth": 0}, {"key": "39380921", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668455981276006, "ground_truth": 0}, {"key": "39037490", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.24077458805063626, "ground_truth": 0}, {"key": "39037490", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.16451646300657058, "ground_truth": 0}, {"key": "39037490", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.10970576886972849, "ground_truth": 0}, {"key": "39037490", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.18359362912535107, "ground_truth": 0}, {"key": "39037490", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092207817526664, "ground_truth": 0}, {"key": "35917499", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8376199473531069, "ground_truth": 0}, {"key": "35917499", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9252299622580712, "ground_truth": 0}, {"key": "35917499", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8998277790966892, "ground_truth": 0}, {"key": "35917499", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256467726052, "ground_truth": 0}, {"key": "35917499", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840453131809, "ground_truth": 0}, {"key": "34908073", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8354835272776326, "ground_truth": 0}, {"key": "34908073", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8499711803119434, "ground_truth": 0}, {"key": "34908073", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7704647906272081, "ground_truth": 0}, {"key": "34908073", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.752012558412865, "ground_truth": 0}, {"key": "34908073", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011703527147, "ground_truth": 0}, {"key": "36344759", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8749346170820218, "ground_truth": 0}, {"key": "36344759", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6706082945617408, "ground_truth": 0}, {"key": "36344759", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7892337074699008, "ground_truth": 0}, {"key": "36344759", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952890277221, "ground_truth": 0}, {"key": "36344759", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435105766498, "ground_truth": 0}, {"key": "39984637", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7356416621273261, "ground_truth": 0}, {"key": "39984637", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7386690685249299, "ground_truth": 0}, {"key": "39984637", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.49804687797834835, "ground_truth": 0}, {"key": "39984637", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.32939170512312543, "ground_truth": 0}, {"key": "39984637", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.548673499168915, "ground_truth": 0}, {"key": "17917326", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.509764394612303, "ground_truth": 0}, {"key": "17917326", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3208213145310456, "ground_truth": 0}, {"key": "17917326", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7634837559974981, "ground_truth": 0}, {"key": "17917326", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033633102586, "ground_truth": 0}, {"key": "17917326", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47657962865912035, "ground_truth": 0}, {"key": "32193638", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7476159641500681, "ground_truth": 0}, {"key": "32193638", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6926419722133166, "ground_truth": 0}, {"key": "32193638", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7371581662036508, "ground_truth": 0}, {"key": "32193638", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581516434854, "ground_truth": 0}, {"key": "32193638", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.724870266271119, "ground_truth": 0}, {"key": "34564692", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7690802168936499, "ground_truth": 0}, {"key": "34564692", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8233283970068629, "ground_truth": 0}, {"key": "34564692", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8333245896182097, "ground_truth": 0}, {"key": "34564692", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.870597265309535, "ground_truth": 0}, {"key": "34564692", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089099774632, "ground_truth": 0}, {"key": "39329284", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9666631762442361, "ground_truth": 0}, {"key": "39329284", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8816149035014164, "ground_truth": 0}, {"key": "39329284", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9582261211927577, "ground_truth": 0}, {"key": "39329284", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9606574951002648, "ground_truth": 0}, {"key": "39329284", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9575961709041227, "ground_truth": 0}, {"key": "37438541", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6842640199663764, "ground_truth": 0}, {"key": "37438541", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5389832372562934, "ground_truth": 0}, {"key": "37438541", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4765796261363252, "ground_truth": 0}, {"key": "37438541", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.38676346869891964, "ground_truth": 0}, {"key": "37438541", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629586029657273, "ground_truth": 0}, {"key": "34652757", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8568122922159147, "ground_truth": 0}, {"key": "34652757", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7956580904749402, "ground_truth": 0}, {"key": "34652757", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8577681163926065, "ground_truth": 0}, {"key": "34652757", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587186031808206, "ground_truth": 0}, {"key": "34652757", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145755697689, "ground_truth": 0}, {"key": "31361004", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7956581050225696, "ground_truth": 0}, {"key": "31361004", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6757646027222763, "ground_truth": 0}, {"key": "31361004", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8740772299885743, "ground_truth": 0}, {"key": "31361004", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9012274181501697, "ground_truth": 0}, {"key": "31361004", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9268352771507427, "ground_truth": 0}, {"key": "26150727", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2766905349449189, "ground_truth": 0}, {"key": "26150727", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.37570647704948784, "ground_truth": 0}, {"key": "26150727", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.39420092994662265, "ground_truth": 0}, {"key": "26150727", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3665897523288381, "ground_truth": 0}, {"key": "26150727", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4474602890531267, "ground_truth": 0}, {"key": "36997402", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7606506462336968, "ground_truth": 0}, {"key": "36997402", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7122321821391363, "ground_truth": 0}, {"key": "36997402", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.790530296601571, "ground_truth": 0}, {"key": "36997402", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303175162702, "ground_truth": 0}, {"key": "36997402", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441113973168, "ground_truth": 0}, {"key": "37430643", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5409238705099009, "ground_truth": 0}, {"key": "37430643", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6001883658683279, "ground_truth": 0}, {"key": "37430643", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7386690920926837, "ground_truth": 0}, {"key": "37430643", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746097994424, "ground_truth": 0}, {"key": "37430643", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085703993821, "ground_truth": 0}, {"key": "36964631", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7279754769685283, "ground_truth": 0}, {"key": "36964631", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8824278590562032, "ground_truth": 0}, {"key": "36964631", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7918210594080658, "ground_truth": 0}, {"key": "36964631", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031738058968869, "ground_truth": 0}, {"key": "36964631", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740260200334, "ground_truth": 0}, {"key": "35502013", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8164063941402774, "ground_truth": 0}, {"key": "35502013", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6242935592875541, "ground_truth": 0}, {"key": "35502013", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7461390052556602, "ground_truth": 0}, {"key": "35502013", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445677421585, "ground_truth": 0}, {"key": "35502013", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253893078183, "ground_truth": 0}, {"key": "33987664", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8386797633443204, "ground_truth": 0}, {"key": "33987664", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9111797119257284, "ground_truth": 0}, {"key": "33987664", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8705972664869908, "ground_truth": 0}, {"key": "33987664", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972761815309, "ground_truth": 0}, {"key": "33987664", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267118024541857, "ground_truth": 0}, {"key": "35203721", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4746311752122657, "ground_truth": 0}, {"key": "35203721", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6654105600861884, "ground_truth": 0}, {"key": "35203721", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5832033656765209, "ground_truth": 0}, {"key": "35203721", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.47852886299924124, "ground_truth": 0}, {"key": "35203721", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891376582249, "ground_truth": 0}, {"key": "39028348", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8210441207226288, "ground_truth": 0}, {"key": "39028348", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7563575596368298, "ground_truth": 0}, {"key": "39028348", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8529354806902039, "ground_truth": 0}, {"key": "39028348", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619269387031, "ground_truth": 0}, {"key": "39028348", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891250084358, "ground_truth": 0}, {"key": "37459383", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8791467782291766, "ground_truth": 0}, {"key": "37459383", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8128673251749852, "ground_truth": 0}, {"key": "37459383", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8438951081476989, "ground_truth": 0}, {"key": "37459383", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894603408579, "ground_truth": 0}, {"key": "37459383", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438951123710404, "ground_truth": 0}, {"key": "34020070", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7563575750584912, "ground_truth": 0}, {"key": "34020070", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7592254051716674, "ground_truth": 0}, {"key": "34020070", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7839884554162628, "ground_truth": 0}, {"key": "34020070", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358456831146, "ground_truth": 0}, {"key": "34020070", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389922191383, "ground_truth": 0}, {"key": "35176615", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7057850038815375, "ground_truth": 0}, {"key": "35176615", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7106282889975535, "ground_truth": 0}, {"key": "35176615", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5813030876969806, "ground_truth": 0}, {"key": "35176615", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953363710903, "ground_truth": 0}, {"key": "35176615", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936424238208, "ground_truth": 0}, {"key": "33296389", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9155072466876888, "ground_truth": 0}, {"key": "33296389", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7853085911838186, "ground_truth": 0}, {"key": "33296389", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7905303168353414, "ground_truth": 0}, {"key": "33296389", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9353465112275469, "ground_truth": 0}, {"key": "33296389", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568123036698795, "ground_truth": 0}, {"key": "35399504", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9621075778924956, "ground_truth": 0}, {"key": "35399504", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9773708004362215, "ground_truth": 0}, {"key": "35399504", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9441768592779123, "ground_truth": 0}, {"key": "35399504", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9651191138211277, "ground_truth": 0}, {"key": "35399504", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9615338072374546, "ground_truth": 0}, {"key": "34807886", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "34807886", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3684056880604311, "ground_truth": 0}, {"key": "34807886", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3007455940149272, "ground_truth": 0}, {"key": "34807886", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.32594952786613496, "ground_truth": 0}, {"key": "34807886", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.329391727984714, "ground_truth": 0}, {"key": "37629813", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7025300818510815, "ground_truth": 0}, {"key": "37629813", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5563995734086836, "ground_truth": 0}, {"key": "37629813", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7057850463668992, "ground_truth": 0}, {"key": "37629813", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506536037216, "ground_truth": 0}, {"key": "37629813", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014027329537, "ground_truth": 0}, {"key": "28084389", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4590761562603945, "ground_truth": 0}, {"key": "28084389", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8019358367244105, "ground_truth": 0}, {"key": "28084389", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7879311800406738, "ground_truth": 0}, {"key": "28084389", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.910545388643555, "ground_truth": 0}, {"key": "28084389", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757870059626961, "ground_truth": 0}, {"key": "35391734", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7431680115934788, "ground_truth": 0}, {"key": "35391734", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8244619313185996, "ground_truth": 0}, {"key": "35391734", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8807970746785506, "ground_truth": 0}, {"key": "35391734", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.814052794269421, "ground_truth": 0}, {"key": "35391734", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343807189991, "ground_truth": 0}, {"key": "40214591", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6279512209095413, "ground_truth": 0}, {"key": "40214591", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8128673260882457, "ground_truth": 0}, {"key": "40214591", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4765796139927624, "ground_truth": 0}, {"key": "40214591", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102666824744, "ground_truth": 0}, {"key": "40214591", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241494018956, "ground_truth": 0}, {"key": "26283171", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8116760160843078, "ground_truth": 0}, {"key": "26283171", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8333245931365725, "ground_truth": 0}, {"key": "26283171", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7170118909058639, "ground_truth": 0}, {"key": "26283171", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998561905704, "ground_truth": 0}, {"key": "26283171", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059181517246, "ground_truth": 0}, {"key": "37084030", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.22405545151850131, "ground_truth": 0}, {"key": "37084030", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4687906323937486, "ground_truth": 0}, {"key": "37084030", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2643583399703649, "ground_truth": 0}, {"key": "37084030", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.26435836645572697, "ground_truth": 0}, {"key": "37084030", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3242354091754312, "ground_truth": 0}, {"key": "39027295", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.32766829791849233, "ground_truth": 0}, {"key": "39027295", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.30569731720885546, "ground_truth": 0}, {"key": "39027295", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5039061864430258, "ground_truth": 0}, {"key": "39027295", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.554470495609095, "ground_truth": 0}, {"key": "39027295", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632760781189, "ground_truth": 0}, {"key": "14018647", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.305697319294364, "ground_truth": 0}, {"key": "14018647", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.39606817126122545, "ground_truth": 0}, {"key": "14018647", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.41489886325671316, "ground_truth": 0}, {"key": "14018647", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782568114682995, "ground_truth": 0}, {"key": "14018647", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2422056239690069, "ground_truth": 0}, {"key": "37424289", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9149009546822531, "ground_truth": 0}, {"key": "37424289", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.985271385311396, "ground_truth": 0}, {"key": "37424289", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9536217909950006, "ground_truth": 0}, {"key": "37424289", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9787126456896629, "ground_truth": 0}, {"key": "37424289", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.924687689899144, "ground_truth": 0}, {"key": "37498031", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6909763104623345, "ground_truth": 0}, {"key": "37498031", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8568122934315262, "ground_truth": 0}, {"key": "37498031", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5851011513779081, "ground_truth": 0}, {"key": "37498031", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.888758783538165, "ground_truth": 0}, {"key": "37498031", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786925215094, "ground_truth": 0}, {"key": "30104095", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8354835327591489, "ground_truth": 0}, {"key": "30104095", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6959583431047638, "ground_truth": 0}, {"key": "30104095", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7563575494005871, "ground_truth": 0}, {"key": "30104095", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837534639798, "ground_truth": 0}, {"key": "30104095", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.794384962868664, "ground_truth": 0}, {"key": "37911407", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8816149135111451, "ground_truth": 0}, {"key": "37911407", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9416541621402456, "ground_truth": 0}, {"key": "37911407", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9543079704485071, "ground_truth": 0}, {"key": "37911407", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9648551530007022, "ground_truth": 0}, {"key": "37911407", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9477691453872765, "ground_truth": 0}, {"key": "39177472", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8539127488680015, "ground_truth": 0}, {"key": "39177472", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8175744837164268, "ground_truth": 0}, {"key": "39177472", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8679338557038572, "ground_truth": 0}, {"key": "39177472", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619188828847, "ground_truth": 0}, {"key": "39177472", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493031557822, "ground_truth": 0}, {"key": "32325454", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8679338438061198, "ground_truth": 0}, {"key": "32325454", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9294404060496728, "ground_truth": 0}, {"key": "32325454", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9142907279195956, "ground_truth": 0}, {"key": "32325454", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9257686244433643, "ground_truth": 0}, {"key": "32325454", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110462828912, "ground_truth": 0}, {"key": "38395319", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8267117861348702, "ground_truth": 0}, {"key": "38395319", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8210441160216047, "ground_truth": 0}, {"key": "38395319", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7356416533172435, "ground_truth": 0}, {"key": "38395319", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879312139324534, "ground_truth": 0}, {"key": "38395319", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281495316984, "ground_truth": 0}, {"key": "38235895", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5888891118433234, "ground_truth": 0}, {"key": "38235895", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5717666226145884, "ground_truth": 0}, {"key": "38235895", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4824291107128844, "ground_truth": 0}, {"key": "38235895", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199220361208, "ground_truth": 0}, {"key": "38235895", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.42441200678947044, "ground_truth": 0}, {"key": "26543267", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4016878003412055, "ground_truth": 0}, {"key": "26543267", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4092207841896219, "ground_truth": 0}, {"key": "26543267", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5563995853917325, "ground_truth": 0}, {"key": "26543267", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.37204877977973827, "ground_truth": 0}, {"key": "26543267", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3345894524726805, "ground_truth": 0}, {"key": "39054728", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9920620059665823, "ground_truth": 0}, {"key": "39054728", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9763105310576415, "ground_truth": 0}, {"key": "39054728", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9730364985520801, "ground_truth": 0}, {"key": "39054728", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.991422514598288, "ground_truth": 0}, {"key": "39054728", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.970909241670396, "ground_truth": 0}, {"key": "39158443", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8791467629615235, "ground_truth": 0}, {"key": "39158443", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7813306340245519, "ground_truth": 0}, {"key": "39158443", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8661325179632585, "ground_truth": 0}, {"key": "39158443", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528022912138, "ground_truth": 0}, {"key": "39158443", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544132766294, "ground_truth": 0}, {"key": "36254201", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.40733338388186496, "ground_truth": 0}, {"key": "36254201", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40168777495333413, "ground_truth": 0}, {"key": "36254201", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4980468726795576, "ground_truth": 0}, {"key": "36254201", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3849121329248826, "ground_truth": 0}, {"key": "36254201", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734868835711, "ground_truth": 0}, {"key": "23434347", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5156199464124396, "ground_truth": 0}, {"key": "23434347", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3849121411251676, "ground_truth": 0}, {"key": "23434347", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6876299928628979, "ground_truth": 0}, {"key": "23434347", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251188173735, "ground_truth": 0}, {"key": "23434347", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.764891627393685, "ground_truth": 0}, {"key": "34397620", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4980469101997098, "ground_truth": 0}, {"key": "34397620", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4225046058465931, "ground_truth": 0}, {"key": "34397620", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5117165912338726, "ground_truth": 0}, {"key": "34397620", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061614636625, "ground_truth": 0}, {"key": "34397620", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4902355961010068, "ground_truth": 0}, {"key": "34340916", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6926419650195491, "ground_truth": 0}, {"key": "34340916", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4073334090549043, "ground_truth": 0}, {"key": "34340916", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6095241617753321, "ground_truth": 0}, {"key": "34340916", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241700373062, "ground_truth": 0}, {"key": "34340916", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061851793292, "ground_truth": 0}, {"key": "30375089", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7371581744498765, "ground_truth": 0}, {"key": "30375089", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5097643851228989, "ground_truth": 0}, {"key": "30375089", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6825737162545978, "ground_truth": 0}, {"key": "30375089", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837866346682, "ground_truth": 0}, {"key": "30375089", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461390000942457, "ground_truth": 0}, {"key": "35807797", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9005297955086066, "ground_truth": 0}, {"key": "35807797", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6460136818142523, "ground_truth": 0}, {"key": "35807797", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9005297845883257, "ground_truth": 0}, {"key": "35807797", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105685933153, "ground_truth": 0}, {"key": "35807797", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.907312215862992, "ground_truth": 0}, {"key": "34188172", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7264255957466846, "ground_truth": 0}, {"key": "34188172", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "34188172", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7620700922603793, "ground_truth": 0}, {"key": "34188172", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224597244005, "ground_truth": 0}, {"key": "34188172", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199095756048, "ground_truth": 0}, {"key": "37075567", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8879840492681919, "ground_truth": 0}, {"key": "37075567", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9299510471855005, "ground_truth": 0}, {"key": "37075567", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9511422117383919, "ground_truth": 0}, {"key": "37075567", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549553294648, "ground_truth": 0}, {"key": "37075567", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9149009524615535, "ground_truth": 0}, {"key": "35559735", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8322366449193812, "ground_truth": 0}, {"key": "35559735", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8697146013204222, "ground_truth": 0}, {"key": "35559735", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.865224086566841, "ground_truth": 0}, {"key": "35559735", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419739804954, "ground_truth": 0}, {"key": "35559735", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253745754722, "ground_truth": 0}, {"key": "33005019", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.523420366559811, "ground_truth": 0}, {"key": "33005019", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5506073707733709, "ground_truth": 0}, {"key": "33005019", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6740504664252502, "ground_truth": 0}, {"key": "33005019", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702734375816, "ground_truth": 0}, {"key": "33005019", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224477620226, "ground_truth": 0}, {"key": "30808252", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6169358038800201, "ground_truth": 0}, {"key": "30808252", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5428632938284902, "ground_truth": 0}, {"key": "30808252", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6671476751913089, "ground_truth": 0}, {"key": "30808252", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504703639858, "ground_truth": 0}, {"key": "30808252", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4244119922419277, "ground_truth": 0}, {"key": "15159017", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7264255917230643, "ground_truth": 0}, {"key": "15159017", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.866132509372248, "ground_truth": 0}, {"key": "15159017", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8643104468187702, "ground_truth": 0}, {"key": "15159017", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068872700605, "ground_truth": 0}, {"key": "15159017", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.823328399940816, "ground_truth": 0}, {"key": "24493400", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6531269183729577, "ground_truth": 0}, {"key": "24493400", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.48438009036897284, "ground_truth": 0}, {"key": "24493400", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.700894825354931, "ground_truth": 0}, {"key": "24493400", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168781320421615, "ground_truth": 0}, {"key": "24493400", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389727057419, "ground_truth": 0}, {"key": "37791071", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8807970736959808, "ground_truth": 0}, {"key": "37791071", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8187367901514095, "ground_truth": 0}, {"key": "37791071", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9381240166513992, "ground_truth": 0}, {"key": "37791071", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206736819914, "ground_truth": 0}, {"key": "37791071", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127515423272, "ground_truth": 0}, {"key": "33528627", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8080672085259041, "ground_truth": 0}, {"key": "33528627", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7786493316570973, "ground_truth": 0}, {"key": "33528627", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.864310445012266, "ground_truth": 0}, {"key": "33528627", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802522311884, "ground_truth": 0}, {"key": "33528627", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797610571465, "ground_truth": 0}, {"key": "39925662", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9099070005599991, "ground_truth": 0}, {"key": "39925662", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9453993882786907, "ground_truth": 0}, {"key": "39925662", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9319595821740115, "ground_truth": 0}, {"key": "39925662", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288442555543, "ground_truth": 0}, {"key": "39925662", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743576337393, "ground_truth": 0}, {"key": "29213416", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3007455595830851, "ground_truth": 0}, {"key": "29213416", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7041601271389968, "ground_truth": 0}, {"key": "29213416", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5640984594827746, "ground_truth": 0}, {"key": "29213416", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832299107071, "ground_truth": 0}, {"key": "29213416", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3849121406621907, "ground_truth": 0}, {"key": "34492745", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4610168126618978, "ground_truth": 0}, {"key": "34492745", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3451052736989346, "ground_truth": 0}, {"key": "34492745", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5136684776460999, "ground_truth": 0}, {"key": "34492745", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835415618274, "ground_truth": 0}, {"key": "34492745", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125811211699, "ground_truth": 0}, {"key": "34191937", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6206216438128546, "ground_truth": 0}, {"key": "34191937", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3793783551606531, "ground_truth": 0}, {"key": "34191937", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.644225112923692, "ground_truth": 0}, {"key": "34191937", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631560495553, "ground_truth": 0}, {"key": "34191937", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926420005986853, "ground_truth": 0}, {"key": "34933372", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8840392785584049, "ground_truth": 0}, {"key": "34933372", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8489721945829063, "ground_truth": 0}, {"key": "34933372", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7534666551638034, "ground_truth": 0}, {"key": "34933372", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545674583116, "ground_truth": 0}, {"key": "34933372", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.801935838786871, "ground_truth": 0}, {"key": "38714379", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.957277801938423, "ground_truth": 0}, {"key": "38714379", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9235923155306088, "ground_truth": 0}, {"key": "38714379", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9676556682435559, "ground_truth": 0}, {"key": "38714379", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9594592616119477, "ground_truth": 0}, {"key": "38714379", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9314625119419213, "ground_truth": 0}, {"key": "39220660", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8198933305847724, "ground_truth": 0}, {"key": "39220660", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9566342005115523, "ground_truth": 0}, {"key": "39220660", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8976952914711742, "ground_truth": 0}, {"key": "39220660", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9059898100230657, "ground_truth": 0}, {"key": "39220660", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424261069651, "ground_truth": 0}, {"key": "41028780", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6601723719381818, "ground_truth": 0}, {"key": "41028780", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8278281585607745, "ground_truth": 0}, {"key": "41028780", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7634837666900646, "ground_truth": 0}, {"key": "41028780", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321915410964, "ground_truth": 0}, {"key": "41028780", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531268983927131, "ground_truth": 0}, {"key": "39457108", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.741674024309181, "ground_truth": 0}, {"key": "39457108", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.30239109526160074, "ground_truth": 0}, {"key": "39457108", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5964331414300394, "ground_truth": 0}, {"key": "39457108", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241888376647, "ground_truth": 0}, {"key": "39457108", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321622349461, "ground_truth": 0}, {"key": "38288018", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2068940505388845, "ground_truth": 0}, {"key": "38288018", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.29746995522678465, "ground_truth": 0}, {"key": "38288018", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.14318771548308842, "ground_truth": 0}, {"key": "38288018", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.26740816335036877, "ground_truth": 0}, {"key": "38288018", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.22000709894888898, "ground_truth": 0}, {"key": "40106293", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3468730884351386, "ground_truth": 0}, {"key": "40106293", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.31912138775611126, "ground_truth": 0}, {"key": "40106293", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.40356690331177214, "ground_truth": 0}, {"key": "40106293", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3293917221977579, "ground_truth": 0}, {"key": "40106293", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.31742625248233824, "ground_truth": 0}, {"key": "39948797", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7401743575388562, "ground_truth": 0}, {"key": "39948797", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9653811628014889, "ground_truth": 0}, {"key": "39948797", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7090191066445843, "ground_truth": 0}, {"key": "39948797", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441027506452, "ground_truth": 0}, {"key": "39948797", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145909324463, "ground_truth": 0}, {"key": "31853399", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.925229956504073, "ground_truth": 0}, {"key": "31853399", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6791787254451875, "ground_truth": 0}, {"key": "31853399", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8998277729197542, "ground_truth": 0}, {"key": "31853399", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587970404133, "ground_truth": 0}, {"key": "31853399", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.883235981027517, "ground_truth": 0}, {"key": "35273252", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.21601154823073343, "ground_truth": 0}, {"key": "35273252", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.48047867604869626, "ground_truth": 0}, {"key": "35273252", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6566582997801818, "ground_truth": 0}, {"key": "35273252", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689404967447514, "ground_truth": 0}, {"key": "35273252", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793784171205912, "ground_truth": 0}, {"key": "37130459", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9278877875268864, "ground_truth": 0}, {"key": "37130459", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9844563523810728, "ground_truth": 0}, {"key": "37130459", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9111797159972762, "ground_truth": 0}, {"key": "37130459", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.909907013188103, "ground_truth": 0}, {"key": "37130459", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9804313242921799, "ground_truth": 0}, {"key": "21734003", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7461389877316514, "ground_truth": 0}, {"key": "21734003", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9026096072229784, "ground_truth": 0}, {"key": "21734003", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8300437729420089, "ground_truth": 0}, {"key": "21734003", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343673003412, "ground_truth": 0}, {"key": "21734003", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511495315012, "ground_truth": 0}, {"key": "33990737", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6876300011741354, "ground_truth": 0}, {"key": "33990737", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6206216045251098, "ground_truth": 0}, {"key": "33990737", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6893056102103154, "ground_truth": 0}, {"key": "33990737", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.45132649451878665, "ground_truth": 0}, {"key": "33990737", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754743680303, "ground_truth": 0}, {"key": "34559912", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9224823450673426, "ground_truth": 0}, {"key": "34559912", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8955226734314973, "ground_truth": 0}, {"key": "34559912", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8322366511694864, "ground_truth": 0}, {"key": "34559912", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346140323044, "ground_truth": 0}, {"key": "34559912", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366494679175, "ground_truth": 0}, {"key": "39820439", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.1968262035089663, "ground_truth": 0}, {"key": "39820439", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.41679663841275916, "ground_truth": 0}, {"key": "39820439", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5058591135281858, "ground_truth": 0}, {"key": "39820439", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3629692087118535, "ground_truth": 0}, {"key": "39820439", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2798285141792944, "ground_truth": 0}, {"key": "34759328", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9362850128824357, "ground_truth": 0}, {"key": "34759328", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9678992966870883, "ground_truth": 0}, {"key": "34759328", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9728307677629403, "ground_truth": 0}, {"key": "34759328", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.952925819610713, "ground_truth": 0}, {"key": "34759328", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9403530536944575, "ground_truth": 0}, {"key": "36939137", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7325918449903586, "ground_truth": 0}, {"key": "36939137", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7008948093038467, "ground_truth": 0}, {"key": "36939137", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.605799047033793, "ground_truth": 0}, {"key": "36939137", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148331554538, "ground_truth": 0}, {"key": "36939137", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545687624251, "ground_truth": 0}, {"key": "35851522", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7786493043275069, "ground_truth": 0}, {"key": "35851522", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7310585807046773, "ground_truth": 0}, {"key": "35851522", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6909762962008847, "ground_truth": 0}, {"key": "35851522", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948319568571, "ground_truth": 0}, {"key": "35851522", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689358360218, "ground_truth": 0}, {"key": "22412782", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8643104524395568, "ground_truth": 0}, {"key": "22412782", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6654105567904339, "ground_truth": 0}, {"key": "22412782", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7943849553784235, "ground_truth": 0}, {"key": "22412782", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333246100397718, "ground_truth": 0}, {"key": "22412782", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748582207441, "ground_truth": 0}, {"key": "38579227", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9079671372641205, "ground_truth": 0}, {"key": "38579227", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9196425341893161, "ground_truth": 0}, {"key": "38579227", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9202179925829236, "ground_truth": 0}, {"key": "38579227", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.853912760968873, "ground_truth": 0}, {"key": "38579227", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9257686323542866, "ground_truth": 0}, {"key": "37206995", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8221891357235579, "ground_truth": 0}, {"key": "37206995", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9207896798813241, "ground_truth": 0}, {"key": "37206995", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7772998788194275, "ground_truth": 0}, {"key": "37206995", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.887204592104421, "ground_truth": 0}, {"key": "37206995", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744799411822, "ground_truth": 0}, {"key": "38700847", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8969755791497976, "ground_truth": 0}, {"key": "38700847", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8499711715118797, "ground_truth": 0}, {"key": "38700847", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9118099543256337, "ground_truth": 0}, {"key": "38700847", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9005297884198455, "ground_truth": 0}, {"key": "38700847", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338424581975, "ground_truth": 0}, {"key": "20246590", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9910145709379473, "ground_truth": 0}, {"key": "20246590", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9939964043506861, "ground_truth": 0}, {"key": "20246590", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.986979509696693, "ground_truth": 0}, {"key": "20246590", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9808759628764009, "ground_truth": 0}, {"key": "20246590", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9801292862986044, "ground_truth": 0}, {"key": "39141360", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8606036230724569, "ground_truth": 0}, {"key": "39141360", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.638835294415259, "ground_truth": 0}, {"key": "39141360", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8976952807900138, "ground_truth": 0}, {"key": "39141360", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511582888627, "ground_truth": 0}, {"key": "39141360", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423313264319, "ground_truth": 0}, {"key": "37906226", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6671476856022781, "ground_truth": 0}, {"key": "37906226", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6057990516414722, "ground_truth": 0}, {"key": "37906226", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4167966131831867, "ground_truth": 0}, {"key": "37906226", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819798119049, "ground_truth": 0}, {"key": "37906226", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3979384267155241, "ground_truth": 0}, {"key": "16201033", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5273165486229722, "ground_truth": 0}, {"key": "16201033", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6352224552042463, "ground_truth": 0}, {"key": "16201033", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6943026857674593, "ground_truth": 0}, {"key": "16201033", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228835835589, "ground_truth": 0}, {"key": "16201033", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089065688941, "ground_truth": 0}, {"key": "36469022", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5698526411609408, "ground_truth": 0}, {"key": "36469022", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5097643768225218, "ground_truth": 0}, {"key": "36469022", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5506073715200289, "ground_truth": 0}, {"key": "36469022", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.699254427714734, "ground_truth": 0}, {"key": "36469022", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.476579664797739, "ground_truth": 0}, {"key": "31295270", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.20946969087912728, "ground_truth": 0}, {"key": "31295270", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2798284762164672, "ground_truth": 0}, {"key": "31295270", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.21337717026025005, "ground_truth": 0}, {"key": "31295270", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.32423540141790513, "ground_truth": 0}, {"key": "31295270", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3056973219938983, "ground_truth": 0}, {"key": "35360689", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.48828337930161186, "ground_truth": 0}, {"key": "35360689", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.37570647796991985, "ground_truth": 0}, {"key": "35360689", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4629586256934586, "ground_truth": 0}, {"key": "35360689", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.32939170004505686, "ground_truth": 0}, {"key": "35360689", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.509764382987446, "ground_truth": 0}, {"key": "29202793", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4551985751757631, "ground_truth": 0}, {"key": "29202793", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.22541660838191685, "ground_truth": 0}, {"key": "29202793", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5448013936040242, "ground_truth": 0}, {"key": "29202793", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653334912340175, "ground_truth": 0}, {"key": "29202793", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4111108765191848, "ground_truth": 0}, {"key": "35999008", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6926419908263058, "ground_truth": 0}, {"key": "35999008", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5640984860057787, "ground_truth": 0}, {"key": "35999008", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7563575612175365, "ground_truth": 0}, {"key": "35999008", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4551985803987985, "ground_truth": 0}, {"key": "35999008", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269105458497, "ground_truth": 0}, {"key": "31797119", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7476159487282608, "ground_truth": 0}, {"key": "31797119", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.848972212145, "ground_truth": 0}, {"key": "31797119", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7620701244271089, "ground_truth": 0}, {"key": "31797119", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199541049631, "ground_truth": 0}, {"key": "31797119", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972649010327, "ground_truth": 0}, {"key": "26711893", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7008947973643386, "ground_truth": 0}, {"key": "26711893", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6757645946298535, "ground_truth": 0}, {"key": "26711893", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.803173813248248, "ground_truth": 0}, {"key": "26711893", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.592666579823038, "ground_truth": 0}, {"key": "26711893", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352616470889, "ground_truth": 0}, {"key": "35348288", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5389832110662754, "ground_truth": 0}, {"key": "35348288", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.48438010558734296, "ground_truth": 0}, {"key": "35348288", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5525396970446007, "ground_truth": 0}, {"key": "35348288", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880048426424, "ground_truth": 0}, {"key": "35348288", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014072914581, "ground_truth": 0}, {"key": "38124131", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.27825680334959274, "ground_truth": 0}, {"key": "38124131", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.16885694014397482, "ground_truth": 0}, {"key": "38124131", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2133771684220243, "ground_truth": 0}, {"key": "38124131", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3040416728780534, "ground_truth": 0}, {"key": "38124131", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2081789416839345, "ground_truth": 0}, {"key": "20285901", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7217432095184724, "ground_truth": 0}, {"key": "20285901", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6224593238546515, "ground_truth": 0}, {"key": "20285901", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7090191354889996, "ground_truth": 0}, {"key": "20285901", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702928032047, "ground_truth": 0}, {"key": "20285901", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185806001099, "ground_truth": 0}, {"key": "35633632", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7969253772515427, "ground_truth": 0}, {"key": "35633632", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6566582767904576, "ground_truth": 0}, {"key": "35633632", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7279754435547583, "ground_truth": 0}, {"key": "35633632", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943754147675, "ground_truth": 0}, {"key": "35633632", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898623715804, "ground_truth": 0}, {"key": "10741274", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.23370634730922438, "ground_truth": 0}, {"key": "10741274", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6242935267903666, "ground_truth": 0}, {"key": "10741274", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.41111086299596783, "ground_truth": 0}, {"key": "10741274", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181322549366315, "ground_truth": 0}, {"key": "10741274", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.19193277122933552, "ground_truth": 0}, {"key": "30605795", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8031738042775516, "ground_truth": 0}, {"key": "30605795", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7008948056950243, "ground_truth": 0}, {"key": "30605795", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7310585758621834, "ground_truth": 0}, {"key": "30605795", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307433913882, "ground_truth": 0}, {"key": "30605795", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.567936588039365, "ground_truth": 0}, {"key": "30539722", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7356416323995877, "ground_truth": 0}, {"key": "30539722", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5679365918395702, "ground_truth": 0}, {"key": "30539722", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "30539722", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802274401647, "ground_truth": 0}, {"key": "30539722", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964186022671, "ground_truth": 0}, {"key": "18639299", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4378234845465017, "ground_truth": 0}, {"key": "18639299", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2845759932939866, "ground_truth": 0}, {"key": "18639299", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.41869690816554034, "ground_truth": 0}, {"key": "18639299", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.27669052780040276, "ground_truth": 0}, {"key": "18639299", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.29910516603274667, "ground_truth": 0}, {"key": "39773552", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7248702579921532, "ground_truth": 0}, {"key": "39773552", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7853085811200843, "ground_truth": 0}, {"key": "39773552", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7490872130494781, "ground_truth": 0}, {"key": "39773552", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740397326406, "ground_truth": 0}, {"key": "39773552", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195367181474, "ground_truth": 0}, {"key": "34086410", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4824290990487757, "ground_truth": 0}, {"key": "34086410", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.37754067082626525, "ground_truth": 0}, {"key": "34086410", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4148988582861901, "ground_truth": 0}, {"key": "34086410", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.36658971322241524, "ground_truth": 0}, {"key": "34086410", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.687629993490795, "ground_truth": 0}, {"key": "35454652", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7648916096264136, "ground_truth": 0}, {"key": "35454652", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8679338512948672, "ground_truth": 0}, {"key": "35454652", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7185943993421251, "ground_truth": 0}, {"key": "35454652", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869865031724, "ground_truth": 0}, {"key": "35454652", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619304200036, "ground_truth": 0}, {"key": "36158310", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8539127347112542, "ground_truth": 0}, {"key": "36158310", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4824291121536873, "ground_truth": 0}, {"key": "36158310", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8311430630465287, "ground_truth": 0}, {"key": "36158310", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489721948582134, "ground_truth": 0}, {"key": "36158310", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601506063422, "ground_truth": 0}, {"key": "35688387", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4416730190803021, "ground_truth": 0}, {"key": "35688387", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8152324834309331, "ground_truth": 0}, {"key": "35688387", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.1623800281796262, "ground_truth": 0}, {"key": "35688387", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4707366202911817, "ground_truth": 0}, {"key": "35688387", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.18713268488524548, "ground_truth": 0}, {"key": "34209292", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8962513753558008, "ground_truth": 0}, {"key": "34209292", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7431680055847308, "ground_truth": 0}, {"key": "34209292", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8840392852250841, "ground_truth": 0}, {"key": "34209292", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357619799134, "ground_truth": 0}, {"key": "34209292", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357700210757, "ground_truth": 0}, {"key": "25037859", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5097644159570212, "ground_truth": 0}, {"key": "25037859", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4863315260331782, "ground_truth": 0}, {"key": "25037859", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5563995728341292, "ground_truth": 0}, {"key": "25037859", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318467015925, "ground_truth": 0}, {"key": "25037859", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544100627894, "ground_truth": 0}, {"key": "36412121", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8714748600830095, "ground_truth": 0}, {"key": "36412121", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8984105587414616, "ground_truth": 0}, {"key": "36412121", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.869714577731255, "ground_truth": 0}, {"key": "36412121", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9219218414680231, "ground_truth": 0}, {"key": "36412121", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9334308123216325, "ground_truth": 0}, {"key": "34909172", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7839884718816305, "ground_truth": 0}, {"key": "34909172", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7563575613172892, "ground_truth": 0}, {"key": "34909172", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.846957846314431, "ground_truth": 0}, {"key": "34909172", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338383265581, "ground_truth": 0}, {"key": "34909172", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416739790402679, "ground_truth": 0}, {"key": "39011806", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7943849598652022, "ground_truth": 0}, {"key": "39011806", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9184802415829222, "ground_truth": 0}, {"key": "39011806", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8624675320957222, "ground_truth": 0}, {"key": "39011806", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9039745062293655, "ground_truth": 0}, {"key": "39011806", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740275384576, "ground_truth": 0}, {"key": "33096163", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7248702840172302, "ground_truth": 0}, {"key": "33096163", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8984105616585217, "ground_truth": 0}, {"key": "33096163", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9142907291576601, "ground_truth": 0}, {"key": "33096163", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673114779774, "ground_truth": 0}, {"key": "33096163", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802692228899, "ground_truth": 0}, {"key": "38762205", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8872046076102743, "ground_truth": 0}, {"key": "38762205", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9615338098682302, "ground_truth": 0}, {"key": "38762205", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8479677532039351, "ground_truth": 0}, {"key": "38762205", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9294404027440204, "ground_truth": 0}, {"key": "38762205", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.907967138336453, "ground_truth": 0}, {"key": "35519177", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.763483753053142, "ground_truth": 0}, {"key": "35519177", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6636689427970567, "ground_truth": 0}, {"key": "35519177", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9469902336361274, "ground_truth": 0}, {"key": "35519177", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835462412402, "ground_truth": 0}, {"key": "35519177", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737906855572, "ground_truth": 0}, {"key": "36192531", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6113819556029809, "ground_truth": 0}, {"key": "36192531", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6224593104205569, "ground_truth": 0}, {"key": "36192531", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5640984605053609, "ground_truth": 0}, {"key": "36192531", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251265695195, "ground_truth": 0}, {"key": "36192531", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916155213266, "ground_truth": 0}, {"key": "33160852", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8723473702134359, "ground_truth": 0}, {"key": "33160852", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8519527910580125, "ground_truth": 0}, {"key": "33160852", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.913058340253902, "ground_truth": 0}, {"key": "33160852", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9621075724086112, "ground_truth": 0}, {"key": "33160852", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9575961721081877, "ground_truth": 0}, {"key": "36312304", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6113819466666541, "ground_truth": 0}, {"key": "36312304", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.55060735004815, "ground_truth": 0}, {"key": "36312304", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.49414092430021556, "ground_truth": 0}, {"key": "36312304", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216354689896, "ground_truth": 0}, {"key": "36312304", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762984672456, "ground_truth": 0}, {"key": "33773343", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.49804686158955336, "ground_truth": 0}, {"key": "33773343", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5389832142691321, "ground_truth": 0}, {"key": "33773343", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5019531083692135, "ground_truth": 0}, {"key": "33773343", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203809395167, "ground_truth": 0}, {"key": "33773343", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.41111085188550034, "ground_truth": 0}, {"key": "34913320", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5832033549867387, "ground_truth": 0}, {"key": "34913320", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5621764973922593, "ground_truth": 0}, {"key": "34913320", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7356416367089949, "ground_truth": 0}, {"key": "34913320", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.769080252253687, "ground_truth": 0}, {"key": "34913320", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416562764353, "ground_truth": 0}, {"key": "33784155", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8615382193151893, "ground_truth": 0}, {"key": "33784155", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8221891373074867, "ground_truth": 0}, {"key": "33784155", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7704647837568673, "ground_truth": 0}, {"key": "33784155", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149933331856, "ground_truth": 0}, {"key": "33784155", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802475349241, "ground_truth": 0}, {"key": "24085062", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9746286878389301, "ground_truth": 0}, {"key": "24085062", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9968763512572463, "ground_truth": 0}, {"key": "24085062", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9681411443371564, "ground_truth": 0}, {"key": "24085062", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9773708023411765, "ground_truth": 0}, {"key": "24085062", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9890130564925395, "ground_truth": 0}, {"key": "33893487", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3311197315401708, "ground_truth": 0}, {"key": "33893487", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.15405755395854065, "ground_truth": 0}, {"key": "33893487", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.34510525800722813, "ground_truth": 0}, {"key": "33893487", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684421225366, "ground_truth": 0}, {"key": "33893487", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199272395133, "ground_truth": 0}, {"key": "40913011", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9012274178653098, "ground_truth": 0}, {"key": "40913011", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9257686305079845, "ground_truth": 0}, {"key": "40913011", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9173026513363277, "ground_truth": 0}, {"key": "40913011", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9278877961013127, "ground_truth": 0}, {"key": "40913011", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9039745188460633, "ground_truth": 0}, {"key": "29642545", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.32939172624174773, "ground_truth": 0}, {"key": "29642545", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3522017889802964, "ground_truth": 0}, {"key": "29642545", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.422504659794053, "ground_truth": 0}, {"key": "29642545", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.390475844914934, "ground_truth": 0}, {"key": "29642545", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2814056102198622, "ground_truth": 0}, {"key": "35969159", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7690802563689557, "ground_truth": 0}, {"key": "35969159", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7295197805262721, "ground_truth": 0}, {"key": "35969159", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8164063665840151, "ground_truth": 0}, {"key": "35969159", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389894550381, "ground_truth": 0}, {"key": "35969159", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.699254420748635, "ground_truth": 0}, {"key": "37081669", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.20055766913278694, "ground_truth": 0}, {"key": "37081669", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.35398630876691806, "ground_truth": 0}, {"key": "37081669", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.42632160211334835, "ground_truth": 0}, {"key": "37081669", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881486967157, "ground_truth": 0}, {"key": "37081669", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2798284961676715, "ground_truth": 0}, {"key": "40048022", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6774740193342169, "ground_truth": 0}, {"key": "40048022", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7690802440310051, "ground_truth": 0}, {"key": "40048022", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.700894811549857, "ground_truth": 0}, {"key": "40048022", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210816063616, "ground_truth": 0}, {"key": "40048022", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321750388221, "ground_truth": 0}, {"key": "32884004", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8104789035698159, "ground_truth": 0}, {"key": "32884004", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9019206839325499, "ground_truth": 0}, {"key": "32884004", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8606036258238181, "ground_truth": 0}, {"key": "32884004", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869875178522, "ground_truth": 0}, {"key": "32884004", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.763483765553329, "ground_truth": 0}, {"key": "39022490", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8596637428287799, "ground_truth": 0}, {"key": "39022490", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8856314754729142, "ground_truth": 0}, {"key": "39022490", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7826624794776644, "ground_truth": 0}, {"key": "39022490", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835253974177, "ground_truth": 0}, {"key": "39022490", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253829609715, "ground_truth": 0}, {"key": "35159385", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.906653116854679, "ground_truth": 0}, {"key": "35159385", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8006920179417096, "ground_truth": 0}, {"key": "35159385", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.740174361893405, "ground_truth": 0}, {"key": "35159385", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392771322715, "ground_truth": 0}, {"key": "35159385", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942076796133, "ground_truth": 0}, {"key": "34363669", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3702254093314377, "ground_truth": 0}, {"key": "34363669", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.36296918220752444, "ground_truth": 0}, {"key": "34363669", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.37204878437537925, "ground_truth": 0}, {"key": "34363669", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.32252596010646584, "ground_truth": 0}, {"key": "34363669", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882834041458065, "ground_truth": 0}, {"key": "36119687", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9278877914425421, "ground_truth": 0}, {"key": "36119687", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8407826073538515, "ground_truth": 0}, {"key": "36119687", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9462003530420304, "ground_truth": 0}, {"key": "36119687", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9618217246132487, "ground_truth": 0}, {"key": "36119687", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9362850053957563, "ground_truth": 0}, {"key": "35217446", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8587185899217192, "ground_truth": 0}, {"key": "35217446", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6992544265729378, "ground_truth": 0}, {"key": "35217446", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8976952965684795, "ground_truth": 0}, {"key": "35217446", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748763101642, "ground_truth": 0}, {"key": "35217446", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245980709588, "ground_truth": 0}, {"key": "39049331", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.834406888371673, "ground_truth": 0}, {"key": "39049331", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.911179706360587, "ground_truth": 0}, {"key": "39049331", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8300437688014837, "ground_truth": 0}, {"key": "39049331", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933435958853, "ground_truth": 0}, {"key": "39049331", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.875786988796781, "ground_truth": 0}, {"key": "36472242", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8278281619307627, "ground_truth": 0}, {"key": "36472242", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8832359889411349, "ground_truth": 0}, {"key": "36472242", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9289263251735167, "ground_truth": 0}, {"key": "36472242", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9005297756027575, "ground_truth": 0}, {"key": "36472242", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923115872104, "ground_truth": 0}, {"key": "31854721", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8509646993892959, "ground_truth": 0}, {"key": "31854721", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8210441424593332, "ground_truth": 0}, {"key": "31854721", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8940517132792304, "ground_truth": 0}, {"key": "31854721", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702970636118, "ground_truth": 0}, {"key": "31854721", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.791821066558899, "ground_truth": 0}, {"key": "18725849", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5563995873704624, "ground_truth": 0}, {"key": "18725849", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5851011769207477, "ground_truth": 0}, {"key": "18725849", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6513548609696953, "ground_truth": 0}, {"key": "18725849", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512666264279, "ground_truth": 0}, {"key": "18725849", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4225046223554393, "ground_truth": 0}, {"key": "36883179", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3557749040724415, "ground_truth": 0}, {"key": "36883179", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4902356403668662, "ground_truth": 0}, {"key": "36883179", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3225259823915104, "ground_truth": 0}, {"key": "36883179", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531156009743, "ground_truth": 0}, {"key": "36883179", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220560846203928, "ground_truth": 0}, {"key": "34266359", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7476159671293351, "ground_truth": 0}, {"key": "34266359", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8757869853678828, "ground_truth": 0}, {"key": "34266359", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8289388019508234, "ground_truth": 0}, {"key": "34266359", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894620727506, "ground_truth": 0}, {"key": "34266359", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.839733983066347, "ground_truth": 0}, {"key": "31920289", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6688802676155057, "ground_truth": 0}, {"key": "31920289", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5253688164478205, "ground_truth": 0}, {"key": "31920289", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5156199510676599, "ground_truth": 0}, {"key": "31920289", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.39981163304850487, "ground_truth": 0}, {"key": "31920289", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5813030747178406, "ground_truth": 0}, {"key": "36292997", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7563575534185047, "ground_truth": 0}, {"key": "36292997", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7931059493114625, "ground_truth": 0}, {"key": "36292997", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8104789098579477, "ground_truth": 0}, {"key": "36292997", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631399460961, "ground_truth": 0}, {"key": "36292997", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.852935475498817, "ground_truth": 0}, {"key": "30412533", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8244619275200598, "ground_truth": 0}, {"key": "30412533", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8606036091155851, "ground_truth": 0}, {"key": "30412533", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.869714577120981, "ground_truth": 0}, {"key": "30412533", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767977095066, "ground_truth": 0}, {"key": "30412533", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339420695792, "ground_truth": 0}, {"key": "40433191", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9546474198312154, "ground_truth": 0}, {"key": "40433191", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9653811625431464, "ground_truth": 0}, {"key": "40433191", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9284087961425338, "ground_truth": 0}, {"key": "40433191", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.95598134841516, "ground_truth": 0}, {"key": "40433191", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9529258231992825, "ground_truth": 0}, {"key": "34565591", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3023910652514434, "ground_truth": 0}, {"key": "34565591", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.1801066604075242, "ground_truth": 0}, {"key": "34565591", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3684056811189043, "ground_truth": 0}, {"key": "34565591", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3812195576633688, "ground_truth": 0}, {"key": "34565591", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.1393963832089247, "ground_truth": 0}, {"key": "36062480", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8791467563639329, "ground_truth": 0}, {"key": "36062480", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.845942445945511, "ground_truth": 0}, {"key": "36062480", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8816149103981316, "ground_truth": 0}, {"key": "36062480", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9339146173835355, "ground_truth": 0}, {"key": "36062480", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430283513785, "ground_truth": 0}, {"key": "37276883", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8925625319156995, "ground_truth": 0}, {"key": "37276883", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8233284091688311, "ground_truth": 0}, {"key": "37276883", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8438950959406117, "ground_truth": 0}, {"key": "37276883", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587911922048, "ground_truth": 0}, {"key": "37276883", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9339146218132909, "ground_truth": 0}, {"key": "38509260", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7185943750033076, "ground_truth": 0}, {"key": "38509260", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7534666586239511, "ground_truth": 0}, {"key": "38509260", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6893056319024216, "ground_truth": 0}, {"key": "38509260", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047022398424, "ground_truth": 0}, {"key": "38509260", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245993450853, "ground_truth": 0}, {"key": "37139607", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8887587860119619, "ground_truth": 0}, {"key": "37139607", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.885631479749372, "ground_truth": 0}, {"key": "37139607", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.892562524778306, "ground_truth": 0}, {"key": "37139607", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148324278054, "ground_truth": 0}, {"key": "37139607", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916199459297, "ground_truth": 0}, {"key": "37092824", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8418256440907633, "ground_truth": 0}, {"key": "37092824", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8529354803846224, "ground_truth": 0}, {"key": "37092824", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8925625321328261, "ground_truth": 0}, {"key": "37092824", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094053081457, "ground_truth": 0}, {"key": "37092824", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786178127489, "ground_truth": 0}, {"key": "32191802", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9600626890350875, "ground_truth": 0}, {"key": "32191802", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9219218272730051, "ground_truth": 0}, {"key": "32191802", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9688561703994775, "ground_truth": 0}, {"key": "32191802", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9832145092940913, "ground_truth": 0}, {"key": "32191802", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9603611574250921, "ground_truth": 0}, {"key": "39396038", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9500414769489357, "ground_truth": 0}, {"key": "39396038", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9618217269670936, "ground_truth": 0}, {"key": "39396038", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9420819109872581, "ground_truth": 0}, {"key": "39396038", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9572777990223855, "ground_truth": 0}, {"key": "39396038", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9381240163933493, "ground_truth": 0}, {"key": "39076884", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7154239995592899, "ground_truth": 0}, {"key": "39076884", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7826624762345037, "ground_truth": 0}, {"key": "39076884", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7745833864895866, "ground_truth": 0}, {"key": "39076884", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336803342314, "ground_truth": 0}, {"key": "39076884", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.675764611666641, "ground_truth": 0}, {"key": "27763432", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3979383995805481, "ground_truth": 0}, {"key": "27763432", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4629586178769134, "ground_truth": 0}, {"key": "27763432", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3225259796450793, "ground_truth": 0}, {"key": "27763432", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.33285232637623074, "ground_truth": 0}, {"key": "27763432", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.411110868625721, "ground_truth": 0}, {"key": "37806929", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8774767862383175, "ground_truth": 0}, {"key": "37806929", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8723473777741069, "ground_truth": 0}, {"key": "37806929", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8895288453567526, "ground_truth": 0}, {"key": "37806929", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9367494697142524, "ground_truth": 0}, {"key": "37806929", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8925625270098062, "ground_truth": 0}, {"key": "32334186", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8080672215146673, "ground_truth": 0}, {"key": "32334186", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8198933479938001, "ground_truth": 0}, {"key": "32334186", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7461390020802482, "ground_truth": 0}, {"key": "32334186", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.874077235929114, "ground_truth": 0}, {"key": "32334186", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359839014161, "ground_truth": 0}, {"key": "36187324", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6460137053883789, "ground_truth": 0}, {"key": "36187324", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8140527934691119, "ground_truth": 0}, {"key": "36187324", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8187367775302097, "ground_truth": 0}, {"key": "36187324", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324872205305, "ground_truth": 0}, {"key": "36187324", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278636312821, "ground_truth": 0}, {"key": "35306009", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9635062387823424, "ground_truth": 0}, {"key": "35306009", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.958537724751354, "ground_truth": 0}, {"key": "35306009", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9553191261999254, "ground_truth": 0}, {"key": "35306009", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9543079639764439, "ground_truth": 0}, {"key": "35306009", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9643214458775236, "ground_truth": 0}, {"key": "39490050", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.104477312423165, "ground_truth": 0}, {"key": "39490050", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.33458945080794716, "ground_truth": 0}, {"key": "39490050", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.27982847457134546, "ground_truth": 0}, {"key": "39490050", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.26284184371640373, "ground_truth": 0}, {"key": "39490050", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559407788024494, "ground_truth": 0}, {"key": "38072149", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6926419978186149, "ground_truth": 0}, {"key": "38072149", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5698526390298364, "ground_truth": 0}, {"key": "38072149", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7905303277977149, "ground_truth": 0}, {"key": "38072149", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506533285055, "ground_truth": 0}, {"key": "38072149", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582737060165, "ground_truth": 0}, {"key": "35899689", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7490872238346723, "ground_truth": 0}, {"key": "35899689", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.672331683598761, "ground_truth": 0}, {"key": "35899689", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8469578547193942, "ground_truth": 0}, {"key": "35899689", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346222836958, "ground_truth": 0}, {"key": "35899689", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036283718979, "ground_truth": 0}, {"key": "27994518", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6132365496635632, "ground_truth": 0}, {"key": "27994518", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5851011319180985, "ground_truth": 0}, {"key": "27994518", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7325918453519954, "ground_truth": 0}, {"key": "27994518", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.476579652279487, "ground_truth": 0}, {"key": "27994518", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.48828340577485596, "ground_truth": 0}, {"key": "10615479", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.16132023740125523, "ground_truth": 0}, {"key": "10615479", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.17667160755298084, "ground_truth": 0}, {"key": "10615479", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3056973173392694, "ground_truth": 0}, {"key": "10615479", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076628398276362, "ground_truth": 0}, {"key": "10615479", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.24653334616931902, "ground_truth": 0}, {"key": "40186667", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8969755721564588, "ground_truth": 0}, {"key": "40186667", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7264255735842888, "ground_truth": 0}, {"key": "40186667", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8529354951051743, "ground_truth": 0}, {"key": "40186667", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.860603618449699, "ground_truth": 0}, {"key": "40186667", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624764039354, "ground_truth": 0}, {"key": "38622886", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8832359797166376, "ground_truth": 0}, {"key": "38622886", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5907792065513334, "ground_truth": 0}, {"key": "38622886", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.823328401913125, "ground_truth": 0}, {"key": "38622886", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767841529337, "ground_truth": 0}, {"key": "38622886", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647037510978, "ground_truth": 0}, {"key": "40686943", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.795658114395956, "ground_truth": 0}, {"key": "40686943", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7264256083327024, "ground_truth": 0}, {"key": "40686943", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7549149947610958, "ground_truth": 0}, {"key": "40686943", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437775370593, "ground_truth": 0}, {"key": "40686943", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467701925262, "ground_truth": 0}, {"key": "30604567", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.965119110428092, "ground_truth": 0}, {"key": "30604567", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9518632290379277, "ground_truth": 0}, {"key": "30604567", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9740426428294533, "ground_truth": 0}, {"key": "30604567", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9569571507991743, "ground_truth": 0}, {"key": "30604567", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9469902253854025, "ground_truth": 0}, {"key": "35440903", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8633916170200021, "ground_truth": 0}, {"key": "35440903", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8152324935785306, "ground_truth": 0}, {"key": "35440903", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8187367957745015, "ground_truth": 0}, {"key": "35440903", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149937697306, "ground_truth": 0}, {"key": "35440903", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879312002608834, "ground_truth": 0}, {"key": "37219533", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5467381522324473, "ground_truth": 0}, {"key": "37219533", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5851011622933618, "ground_truth": 0}, {"key": "37219533", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.642432464412385, "ground_truth": 0}, {"key": "37219533", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216210944873, "ground_truth": 0}, {"key": "37219533", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397235189553, "ground_truth": 0}, {"key": "40178965", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8774767932019473, "ground_truth": 0}, {"key": "40178965", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9385759671505339, "ground_truth": 0}, {"key": "40178965", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8278281605318272, "ground_truth": 0}, {"key": "40178965", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206889983128, "ground_truth": 0}, {"key": "40178965", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9252299637348373, "ground_truth": 0}, {"key": "13750468", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6619228917185204, "ground_truth": 0}, {"key": "13750468", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6791786759755557, "ground_truth": 0}, {"key": "13750468", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6076631689359477, "ground_truth": 0}, {"key": "13750468", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339702795369, "ground_truth": 0}, {"key": "13750468", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432073580821, "ground_truth": 0}, {"key": "17754949", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6601724067818997, "ground_truth": 0}, {"key": "17754949", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4054487252904895, "ground_truth": 0}, {"key": "17754949", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7325918453447731, "ground_truth": 0}, {"key": "17754949", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.734119533949195, "ground_truth": 0}, {"key": "17754949", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125728021946, "ground_truth": 0}, {"key": "36675623", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9678992905173585, "ground_truth": 0}, {"key": "36675623", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9664104937692671, "ground_truth": 0}, {"key": "36675623", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9556514199534304, "ground_truth": 0}, {"key": "36675623", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9155072534593071, "ground_truth": 0}, {"key": "36675623", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9709092454571846, "ground_truth": 0}, {"key": "40035440", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.985384331005449, "ground_truth": 0}, {"key": "40035440", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9860442888850309, "ground_truth": 0}, {"key": "40035440", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9416541602559637, "ground_truth": 0}, {"key": "40035440", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9640516791666994, "ground_truth": 0}, {"key": "40035440", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.96932419832786, "ground_truth": 0}, {"key": "37685909", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5389832215098005, "ground_truth": 0}, {"key": "37685909", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3923368367996724, "ground_truth": 0}, {"key": "37685909", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3647775448279345, "ground_truth": 0}, {"key": "37685909", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180142395454, "ground_truth": 0}, {"key": "37685909", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730879566594, "ground_truth": 0}, {"key": "36938787", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.833324596963325, "ground_truth": 0}, {"key": "36938787", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.642432484633544, "ground_truth": 0}, {"key": "36938787", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.824461938920072, "ground_truth": 0}, {"key": "36938787", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804547936693, "ground_truth": 0}, {"key": "36938787", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970850247847, "ground_truth": 0}, {"key": "39398068", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "39398068", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5717666202293843, "ground_truth": 0}, {"key": "39398068", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6876300135168466, "ground_truth": 0}, {"key": "39398068", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073647311246, "ground_truth": 0}, {"key": "39398068", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762937840335, "ground_truth": 0}, {"key": "39926408", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4130035719090645, "ground_truth": 0}, {"key": "39926408", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6424324870435737, "ground_truth": 0}, {"key": "39926408", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46295860991955107, "ground_truth": 0}, {"key": "39926408", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279511969466627, "ground_truth": 0}, {"key": "39926408", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704657295725, "ground_truth": 0}, {"key": "40465336", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7676898553663029, "ground_truth": 0}, {"key": "40465336", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7662936416568402, "ground_truth": 0}, {"key": "40465336", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8255897234841977, "ground_truth": 0}, {"key": "40465336", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.766293649267172, "ground_truth": 0}, {"key": "40465336", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789021476614, "ground_truth": 0}, {"key": "34173549", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7549150186917903, "ground_truth": 0}, {"key": "34173549", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8386797772513233, "ground_truth": 0}, {"key": "34173549", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7185943790389514, "ground_truth": 0}, {"key": "34173549", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583419270799, "ground_truth": 0}, {"key": "34173549", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105536043645, "ground_truth": 0}, {"key": "33541535", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9092645109435409, "ground_truth": 0}, {"key": "33541535", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7138307611790966, "ground_truth": 0}, {"key": "33541535", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.695958323000654, "ground_truth": 0}, {"key": "33541535", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8955226728261989, "ground_truth": 0}, {"key": "33541535", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942213948982, "ground_truth": 0}, {"key": "35685195", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.794384973319082, "ground_truth": 0}, {"key": "35685195", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5058591127937063, "ground_truth": 0}, {"key": "35685195", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8587185860753296, "ground_truth": 0}, {"key": "35685195", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251098119502, "ground_truth": 0}, {"key": "35685195", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.712232199925895, "ground_truth": 0}, {"key": "28440730", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.16132024472197254, "ground_truth": 0}, {"key": "28440730", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.12940273269339567, "ground_truth": 0}, {"key": "28440730", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6169358313436915, "ground_truth": 0}, {"key": "28440730", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3647775422123625, "ground_truth": 0}, {"key": "28440730", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736784114822472, "ground_truth": 0}, {"key": "38338714", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9241418219505658, "ground_truth": 0}, {"key": "38338714", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9399133534656924, "ground_truth": 0}, {"key": "38338714", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9653811593366379, "ground_truth": 0}, {"key": "38338714", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9546474214696912, "ground_truth": 0}, {"key": "38338714", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9403530616428949, "ground_truth": 0}, {"key": "32191881", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.49023562477710214, "ground_truth": 0}, {"key": "32191881", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2814056053321093, "ground_truth": 0}, {"key": "32191881", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.42059958294087724, "ground_truth": 0}, {"key": "32191881", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2450850120788627, "ground_truth": 0}, {"key": "32191881", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064750206761, "ground_truth": 0}, {"key": "37707251", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6076631642835794, "ground_truth": 0}, {"key": "37707251", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8940517108132372, "ground_truth": 0}, {"key": "37707251", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6876299854882362, "ground_truth": 0}, {"key": "37707251", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723873619705, "ground_truth": 0}, {"key": "37707251", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918405780847, "ground_truth": 0}, {"key": "40172567", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6001883907147649, "ground_truth": 0}, {"key": "40172567", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40168779203329097, "ground_truth": 0}, {"key": "40172567", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6370307943276022, "ground_truth": 0}, {"key": "40172567", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102483760465, "ground_truth": 0}, {"key": "40172567", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864511916790336, "ground_truth": 0}, {"key": "33113255", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8449215313508475, "ground_truth": 0}, {"key": "33113255", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8529354829926898, "ground_truth": 0}, {"key": "33113255", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8479677725116916, "ground_truth": 0}, {"key": "33113255", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437797289631, "ground_truth": 0}, {"key": "33113255", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677673445539, "ground_truth": 0}, {"key": "33022143", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.32939170829143527, "ground_truth": 0}, {"key": "33022143", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4532618108927884, "ground_truth": 0}, {"key": "33022143", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.42441198074059866, "ground_truth": 0}, {"key": "33022143", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883402799086, "ground_truth": 0}, {"key": "33022143", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4035668594855307, "ground_truth": 0}, {"key": "32084473", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.897695289967725, "ground_truth": 0}, {"key": "32084473", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9252299485456158, "ground_truth": 0}, {"key": "32084473", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9184802370278976, "ground_truth": 0}, {"key": "32084473", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9230391732311397, "ground_truth": 0}, {"key": "32084473", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933287069098, "ground_truth": 0}, {"key": "40564245", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5175708892233502, "ground_truth": 0}, {"key": "40564245", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8080672086927787, "ground_truth": 0}, {"key": "40564245", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7170118981307174, "ground_truth": 0}, {"key": "40564245", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832063921703, "ground_truth": 0}, {"key": "40564245", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526343977313, "ground_truth": 0}, {"key": "31717213", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5640984687433743, "ground_truth": 0}, {"key": "31717213", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7431680006991316, "ground_truth": 0}, {"key": "31717213", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8365545678150808, "ground_truth": 0}, {"key": "31717213", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680287842017, "ground_truth": 0}, {"key": "31717213", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982295308561, "ground_truth": 0}, {"key": "34861894", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6976089237785894, "ground_truth": 0}, {"key": "34861894", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6113819742113465, "ground_truth": 0}, {"key": "34861894", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4707365945286735, "ground_truth": 0}, {"key": "34861894", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149822881885, "ground_truth": 0}, {"key": "34861894", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170119041104778, "ground_truth": 0}, {"key": "40838760", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8933094245433832, "ground_truth": 0}, {"key": "40838760", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8749346303500086, "ground_truth": 0}, {"key": "40838760", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7918210759090827, "ground_truth": 0}, {"key": "40838760", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344069000538366, "ground_truth": 0}, {"key": "40838760", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891371233218, "ground_truth": 0}, {"key": "40044849", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9130583428216471, "ground_truth": 0}, {"key": "40044849", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8864204171334318, "ground_truth": 0}, {"key": "40044849", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8969755723924585, "ground_truth": 0}, {"key": "40044849", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9053223015908182, "ground_truth": 0}, {"key": "40044849", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919940261319, "ground_truth": 0}, {"key": "30296116", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4785288308102185, "ground_truth": 0}, {"key": "30296116", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6334102783700518, "ground_truth": 0}, {"key": "30296116", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.44167303026409316, "ground_truth": 0}, {"key": "30296116", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880180940547, "ground_truth": 0}, {"key": "30296116", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.45907613545208814, "ground_truth": 0}, {"key": "34931360", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6057990488959241, "ground_truth": 0}, {"key": "34931360", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7446563331143999, "ground_truth": 0}, {"key": "34931360", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5907791984662684, "ground_truth": 0}, {"key": "34931360", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105548643781, "ground_truth": 0}, {"key": "34931360", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004174107359, "ground_truth": 0}, {"key": "18862422", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6132365423286074, "ground_truth": 0}, {"key": "18862422", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7981867841254152, "ground_truth": 0}, {"key": "18862422", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46295861265571414, "ground_truth": 0}, {"key": "18862422", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.613236587412887, "ground_truth": 0}, {"key": "18862422", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014733580682807, "ground_truth": 0}, {"key": "36361140", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9653811602094279, "ground_truth": 0}, {"key": "36361140", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9196425358672538, "ground_truth": 0}, {"key": "36361140", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9437636542746372, "ground_truth": 0}, {"key": "36361140", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9213576235029414, "ground_truth": 0}, {"key": "36361140", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9458012708155393, "ground_truth": 0}, {"key": "39703329", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.16026602257975098, "ground_truth": 0}, {"key": "39703329", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.38676344633468307, "ground_truth": 0}, {"key": "39703329", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2213506863964527, "ground_truth": 0}, {"key": "39703329", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651623510024014, "ground_truth": 0}, {"key": "39703329", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.21733751412369778, "ground_truth": 0}, {"key": "34033324", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9465966694146245, "ground_truth": 0}, {"key": "34033324", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9453993983905321, "ground_truth": 0}, {"key": "34033324", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8438950930893953, "ground_truth": 0}, {"key": "34033324", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9730365033856818, "ground_truth": 0}, {"key": "34033324", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.955651417593744, "ground_truth": 0}, {"key": "35658862", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8068526244846895, "ground_truth": 0}, {"key": "35658862", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8732148241390083, "ground_truth": 0}, {"key": "35658862", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8428631467918093, "ground_truth": 0}, {"key": "35658862", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.79182107550534, "ground_truth": 0}, {"key": "35658862", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074047297883947, "ground_truth": 0}, {"key": "36092657", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8164063711026431, "ground_truth": 0}, {"key": "36092657", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8068526142084512, "ground_truth": 0}, {"key": "36092657", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7704647826564823, "ground_truth": 0}, {"key": "36092657", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210863733556, "ground_truth": 0}, {"key": "36092657", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175058301659, "ground_truth": 0}, {"key": "26333438", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4111108812169387, "ground_truth": 0}, {"key": "26333438", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6808786196672572, "ground_truth": 0}, {"key": "26333438", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6187804425376825, "ground_truth": 0}, {"key": "26333438", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974733984912734, "ground_truth": 0}, {"key": "26333438", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.753466657979881, "ground_truth": 0}, {"key": "34184963", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4436004142751647, "ground_truth": 0}, {"key": "34184963", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8152324984102467, "ground_truth": 0}, {"key": "34184963", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.44360042358295887, "ground_truth": 0}, {"key": "34184963", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3979384051225865, "ground_truth": 0}, {"key": "34184963", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004242920949, "ground_truth": 0}, {"key": "35069975", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7310585745702768, "ground_truth": 0}, {"key": "35069975", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7295197626336595, "ground_truth": 0}, {"key": "35069975", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7969253704872357, "ground_truth": 0}, {"key": "35069975", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953753800917, "ground_truth": 0}, {"key": "35069975", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526306289916, "ground_truth": 0}, {"key": "36443950", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.43206339686624623, "ground_truth": 0}, {"key": "36443950", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.31742627083540564, "ground_truth": 0}, {"key": "36443950", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5156199145944387, "ground_truth": 0}, {"key": "36443950", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5350984143878399, "ground_truth": 0}, {"key": "36443950", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118745072319, "ground_truth": 0}, {"key": "29460858", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.28937169381606886, "ground_truth": 0}, {"key": "29460858", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2295351995850161, "ground_truth": 0}, {"key": "29460858", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.38306417641837115, "ground_truth": 0}, {"key": "29460858", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225259812372798, "ground_truth": 0}, {"key": "29460858", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3242353891741126, "ground_truth": 0}, {"key": "36155704", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.445529542966606, "ground_truth": 0}, {"key": "36155704", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3398276241936595, "ground_truth": 0}, {"key": "36155704", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.29910518705340083, "ground_truth": 0}, {"key": "36155704", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3157359808847186, "ground_truth": 0}, {"key": "36155704", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.42823342769630846, "ground_truth": 0}, {"key": "37185211", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9213576225220934, "ground_truth": 0}, {"key": "37185211", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6187804279536127, "ground_truth": 0}, {"key": "37185211", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8558511424111888, "ground_truth": 0}, {"key": "37185211", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288438364894, "ground_truth": 0}, {"key": "37185211", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840430541023, "ground_truth": 0}, {"key": "36454885", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6943026704986653, "ground_truth": 0}, {"key": "36454885", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5292634005965628, "ground_truth": 0}, {"key": "36454885", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4707365988575939, "ground_truth": 0}, {"key": "36454885", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476737107038, "ground_truth": 0}, {"key": "36454885", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.658417493016537, "ground_truth": 0}, {"key": "33148906", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3380771465501251, "ground_truth": 0}, {"key": "33148906", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3451052703557452, "ground_truth": 0}, {"key": "33148906", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.22405544900402813, "ground_truth": 0}, {"key": "33148906", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3960681738615456, "ground_truth": 0}, {"key": "33148906", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.19806417634248735, "ground_truth": 0}, {"key": "18086604", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2704802317883841, "ground_truth": 0}, {"key": "18086604", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3007455581126985, "ground_truth": 0}, {"key": "18086604", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.30569731281761753, "ground_truth": 0}, {"key": "18086604", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.22678362319416082, "ground_truth": 0}, {"key": "18086604", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730938023345, "ground_truth": 0}, {"key": "33693397", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6513548580883689, "ground_truth": 0}, {"key": "33693397", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7401743696122203, "ground_truth": 0}, {"key": "33693397", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7170118823511423, "ground_truth": 0}, {"key": "33693397", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.640635861237138, "ground_truth": 0}, {"key": "33693397", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740269571872, "ground_truth": 0}, {"key": "39501530", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5195213307130395, "ground_truth": 0}, {"key": "39501530", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2598256446502914, "ground_truth": 0}, {"key": "39501530", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.28298813194632255, "ground_truth": 0}, {"key": "39501530", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.29098086669705825, "ground_truth": 0}, {"key": "39501530", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.1993079983793348, "ground_truth": 0}, {"key": "30948874", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.760650636730999, "ground_truth": 0}, {"key": "30948874", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8606036298837036, "ground_truth": 0}, {"key": "30948874", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8344068938307969, "ground_truth": 0}, {"key": "30948874", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748648238896, "ground_truth": 0}, {"key": "30948874", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418224153253, "ground_truth": 0}, {"key": "39410675", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8210441131994843, "ground_truth": 0}, {"key": "39410675", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8848377773402151, "ground_truth": 0}, {"key": "39410675", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7943849694091549, "ground_truth": 0}, {"key": "39410675", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767766336896, "ground_truth": 0}, {"key": "39410675", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358379376627, "ground_truth": 0}, {"key": "32903337", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.34864515298550797, "ground_truth": 0}, {"key": "32903337", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3056973266234782, "ground_truth": 0}, {"key": "32903337", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4590761424893625, "ground_truth": 0}, {"key": "32903337", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876300110243884, "ground_truth": 0}, {"key": "32903337", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47073660354937336, "ground_truth": 0}, {"key": "27685132", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.622459320609574, "ground_truth": 0}, {"key": "27685132", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5273165388672664, "ground_truth": 0}, {"key": "27685132", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6020615847488912, "ground_truth": 0}, {"key": "27685132", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331543928316241, "ground_truth": 0}, {"key": "27685132", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3380771102509148, "ground_truth": 0}, {"key": "22791471", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7490872178719709, "ground_truth": 0}, {"key": "22791471", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6926419780410208, "ground_truth": 0}, {"key": "22791471", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8539127405016755, "ground_truth": 0}, {"key": "22791471", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256384592699, "ground_truth": 0}, {"key": "22791471", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.600188381964403, "ground_truth": 0}, {"key": "32292348", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8152325001740509, "ground_truth": 0}, {"key": "32292348", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7341195255667727, "ground_truth": 0}, {"key": "32292348", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8300437576741598, "ground_truth": 0}, {"key": "32292348", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926665955099591, "ground_truth": 0}, {"key": "32292348", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.796925371449792, "ground_truth": 0}, {"key": "20482930", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7563575647891301, "ground_truth": 0}, {"key": "20482930", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7431680123040254, "ground_truth": 0}, {"key": "20482930", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6076631455365884, "ground_truth": 0}, {"key": "20482930", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191546642162, "ground_truth": 0}, {"key": "20482930", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318383710801, "ground_truth": 0}, {"key": "11635754", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6671476544273203, "ground_truth": 0}, {"key": "11635754", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5350984222215938, "ground_truth": 0}, {"key": "11635754", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8688267816428202, "ground_truth": 0}, {"key": "11635754", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346239005182, "ground_truth": 0}, {"key": "11635754", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744723460806, "ground_truth": 0}, {"key": "40029096", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6774740206842951, "ground_truth": 0}, {"key": "40029096", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6242935223341388, "ground_truth": 0}, {"key": "40029096", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6495786218101816, "ground_truth": 0}, {"key": "40029096", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.675764593555312, "ground_truth": 0}, {"key": "40029096", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754690010307, "ground_truth": 0}, {"key": "40414719", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9449947077033503, "ground_truth": 0}, {"key": "40414719", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9674102537528109, "ground_truth": 0}, {"key": "40414719", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9645892689654388, "ground_truth": 0}, {"key": "40414719", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9362850067758071, "ground_truth": 0}, {"key": "40414719", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.925768625765368, "ground_truth": 0}, {"key": "39537616", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.819893327631152, "ground_truth": 0}, {"key": "39537616", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8529354798121569, "ground_truth": 0}, {"key": "39537616", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6976089095682212, "ground_truth": 0}, {"key": "39537616", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307738635623, "ground_truth": 0}, {"key": "39537616", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253738692785, "ground_truth": 0}, {"key": "33245830", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2829881405246637, "ground_truth": 0}, {"key": "33245830", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3380771292793151, "ground_truth": 0}, {"key": "33245830", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.19072404390405315, "ground_truth": 0}, {"key": "33245830", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2538610034421531, "ground_truth": 0}, {"key": "33245830", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2254166024096403, "ground_truth": 0}, {"key": "39243601", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.704160143175825, "ground_truth": 0}, {"key": "39243601", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.707404684333238, "ground_truth": 0}, {"key": "39243601", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5907792113107854, "ground_truth": 0}, {"key": "39243601", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.498046848863049, "ground_truth": 0}, {"key": "39243601", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195238028897, "ground_truth": 0}, {"key": "35815905", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5331544102933052, "ground_truth": 0}, {"key": "35815905", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5292633881543878, "ground_truth": 0}, {"key": "35815905", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.25832597489477954, "ground_truth": 0}, {"key": "35815905", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.558326982046485, "ground_truth": 0}, {"key": "35815905", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878610544136, "ground_truth": 0}, {"key": "35260212", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7310585904928304, "ground_truth": 0}, {"key": "35260212", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7138307646156185, "ground_truth": 0}, {"key": "35260212", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5945512770946685, "ground_truth": 0}, {"key": "35260212", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.75491498839435, "ground_truth": 0}, {"key": "35260212", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154240038480704, "ground_truth": 0}, {"key": "39193924", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4513265027895413, "ground_truth": 0}, {"key": "39193924", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6976089426636154, "ground_truth": 0}, {"key": "39193924", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.43590150247374043, "ground_truth": 0}, {"key": "39193924", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358312716607, "ground_truth": 0}, {"key": "39193924", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416730020943218, "ground_truth": 0}, {"key": "40658569", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.40922076591066314, "ground_truth": 0}, {"key": "40658569", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5717665951926924, "ground_truth": 0}, {"key": "40658569", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46684561446805856, "ground_truth": 0}, {"key": "40658569", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078119025217136, "ground_truth": 0}, {"key": "40658569", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.45713672132970007, "ground_truth": 0}, {"key": "33497596", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8774768008550875, "ground_truth": 0}, {"key": "33497596", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7041601537431904, "ground_truth": 0}, {"key": "33497596", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8164063835239035, "ground_truth": 0}, {"key": "33497596", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506494105578, "ground_truth": 0}, {"key": "33497596", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489721800517451, "ground_truth": 0}, {"key": "40339241", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7520125585571982, "ground_truth": 0}, {"key": "40339241", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8499711725526379, "ground_truth": 0}, {"key": "40339241", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8164063774757416, "ground_truth": 0}, {"key": "40339241", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584175032428212, "ground_truth": 0}, {"key": "40339241", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581590762276, "ground_truth": 0}, {"key": "31792608", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7634837617133824, "ground_truth": 0}, {"key": "31792608", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6757646136069002, "ground_truth": 0}, {"key": "31792608", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7826624637603925, "ground_truth": 0}, {"key": "31792608", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056002281516, "ground_truth": 0}, {"key": "31792608", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011516054927, "ground_truth": 0}, {"key": "33132662", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7279754525550951, "ground_truth": 0}, {"key": "33132662", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6992544345133676, "ground_truth": 0}, {"key": "33132662", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.350421357625353, "ground_truth": 0}, {"key": "33132662", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.786622814779878, "ground_truth": 0}, {"key": "33132662", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990163830305, "ground_truth": 0}, {"key": "37577457", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5698526745230844, "ground_truth": 0}, {"key": "37577457", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.42250462587251875, "ground_truth": 0}, {"key": "37577457", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5621764910333907, "ground_truth": 0}, {"key": "37577457", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303308093309, "ground_truth": 0}, {"key": "37577457", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786071415246, "ground_truth": 0}, {"key": "38701278", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7905303150892562, "ground_truth": 0}, {"key": "38701278", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8740772386750549, "ground_truth": 0}, {"key": "38701278", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8679338488886703, "ground_truth": 0}, {"key": "38701278", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952950232481, "ground_truth": 0}, {"key": "38701278", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531210454596, "ground_truth": 0}, {"key": "34570783", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8910549605696128, "ground_truth": 0}, {"key": "34570783", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9416541633265875, "ground_truth": 0}, {"key": "34570783", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8705972482705323, "ground_truth": 0}, {"key": "34570783", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511360561196, "ground_truth": 0}, {"key": "34570783", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531228597482, "ground_truth": 0}, {"key": "39064526", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8006920144537523, "ground_truth": 0}, {"key": "39064526", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6791787028343045, "ground_truth": 0}, {"key": "39064526", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8164063782504593, "ground_truth": 0}, {"key": "39064526", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528112197722, "ground_truth": 0}, {"key": "39064526", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159420224849, "ground_truth": 0}, {"key": "40741545", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7185943879414805, "ground_truth": 0}, {"key": "40741545", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7431680123802298, "ground_truth": 0}, {"key": "40741545", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7446563475272249, "ground_truth": 0}, {"key": "40741545", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898601461788, "ground_truth": 0}, {"key": "40741545", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381595244916, "ground_truth": 0}, {"key": "36929751", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9252299492105445, "ground_truth": 0}, {"key": "36929751", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9246876935624022, "ground_truth": 0}, {"key": "36929751", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9640516770021352, "ground_truth": 0}, {"key": "36929751", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9761291643029529, "ground_truth": 0}, {"key": "36929751", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9666631741324964, "ground_truth": 0}, {"key": "23984730", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3960681702174472, "ground_truth": 0}, {"key": "23984730", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3380771454762781, "ground_truth": 0}, {"key": "23984730", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3504213868197622, "ground_truth": 0}, {"key": "23984730", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.20817893506197258, "ground_truth": 0}, {"key": "23984730", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3504213839539559, "ground_truth": 0}, {"key": "36007415", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9235923186659658, "ground_truth": 0}, {"key": "36007415", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9674102554157842, "ground_truth": 0}, {"key": "36007415", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9358173499888092, "ground_truth": 0}, {"key": "36007415", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9252299602006705, "ground_truth": 0}, {"key": "36007415", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9671630409442171, "ground_truth": 0}, {"key": "38875041", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8128673328885899, "ground_truth": 0}, {"key": "38875041", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9155072480487702, "ground_truth": 0}, {"key": "38875041", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8697145724942705, "ground_truth": 0}, {"key": "38875041", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354720642843, "ground_truth": 0}, {"key": "38875041", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314811348127, "ground_truth": 0}]