[{"key": "35232142", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5813030712132541, "ground_truth": 0}, {"key": "35232142", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6187804545856669, "ground_truth": 0}, {"key": "35232142", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6020615939171357, "ground_truth": 0}, {"key": "35232142", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.409220800847995, "ground_truth": 0}, {"key": "35232142", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964235847125, "ground_truth": 0}, {"key": "40143035", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8714748529024997, "ground_truth": 0}, {"key": "40143035", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8300437749273086, "ground_truth": 0}, {"key": "40143035", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8104789188479922, "ground_truth": 0}, {"key": "40143035", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.743168025965654, "ground_truth": 0}, {"key": "40143035", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637476000171, "ground_truth": 0}, {"key": "35951548", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8548846513575821, "ground_truth": 0}, {"key": "35951548", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8940517108263952, "ground_truth": 0}, {"key": "35951548", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8596637455343157, "ground_truth": 0}, {"key": "35951548", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325130610606, "ground_truth": 0}, {"key": "35951548", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711616344278, "ground_truth": 0}, {"key": "36266422", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6808786285111242, "ground_truth": 0}, {"key": "36266422", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6808786051116487, "ground_truth": 0}, {"key": "36266422", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6601723767274356, "ground_truth": 0}, {"key": "36266422", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926666125956361, "ground_truth": 0}, {"key": "36266422", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324722707725, "ground_truth": 0}, {"key": "38826984", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.699254408055923, "ground_truth": 0}, {"key": "38826984", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7248702726476401, "ground_truth": 0}, {"key": "38826984", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7106283072385077, "ground_truth": 0}, {"key": "38826984", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891360330161, "ground_truth": 0}, {"key": "38826984", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389994507633, "ground_truth": 0}, {"key": "34540833", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7745833709844872, "ground_truth": 0}, {"key": "34540833", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8864204088620966, "ground_truth": 0}, {"key": "34540833", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7981867856917746, "ground_truth": 0}, {"key": "34540833", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325075956795, "ground_truth": 0}, {"key": "34540833", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.84695782941727, "ground_truth": 0}, {"key": "20836172", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.862467539864669, "ground_truth": 0}, {"key": "20836172", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8386797484200168, "ground_truth": 0}, {"key": "20836172", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8006920130380016, "ground_truth": 0}, {"key": "20836172", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367987443965, "ground_truth": 0}, {"key": "20836172", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239950214109, "ground_truth": 0}, {"key": "35932467", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7264256068046149, "ground_truth": 0}, {"key": "35932467", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.79692537257298, "ground_truth": 0}, {"key": "35932467", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7704647877667169, "ground_truth": 0}, {"key": "35932467", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199596712751, "ground_truth": 0}, {"key": "35932467", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324815602782, "ground_truth": 0}, {"key": "40758845", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9032942082388183, "ground_truth": 0}, {"key": "40758845", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8519528100742613, "ground_truth": 0}, {"key": "40758845", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9012274104306908, "ground_truth": 0}, {"key": "40758845", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336990201292, "ground_truth": 0}, {"key": "40758845", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213826571225, "ground_truth": 0}, {"key": "30358490", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.870597268764774, "ground_truth": 0}, {"key": "30358490", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6893056384306512, "ground_truth": 0}, {"key": "30358490", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7943849696727939, "ground_truth": 0}, {"key": "30358490", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743694090975, "ground_truth": 0}, {"key": "30358490", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631532451876, "ground_truth": 0}, {"key": "34615665", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.946990230620771, "ground_truth": 0}, {"key": "34615665", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.94539939415003, "ground_truth": 0}, {"key": "34615665", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9559813498941915, "ground_truth": 0}, {"key": "34615665", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9645892675745829, "ground_truth": 0}, {"key": "34615665", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923192294077, "ground_truth": 0}, {"key": "35890902", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8548846491598036, "ground_truth": 0}, {"key": "35890902", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8529354746060448, "ground_truth": 0}, {"key": "35890902", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8679338457220328, "ground_truth": 0}, {"key": "35890902", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148291610383, "ground_truth": 0}, {"key": "35890902", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424296783704, "ground_truth": 0}, {"key": "37922330", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7892337008447958, "ground_truth": 0}, {"key": "37922330", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7074047040409939, "ground_truth": 0}, {"key": "37922330", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6774740103786115, "ground_truth": 0}, {"key": "37922330", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592253901267075, "ground_truth": 0}, {"key": "37922330", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085755047143, "ground_truth": 0}, {"key": "30844962", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4092208083469761, "ground_truth": 0}, {"key": "30844962", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6859494466206412, "ground_truth": 0}, {"key": "30844962", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7690802590075037, "ground_truth": 0}, {"key": "30844962", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199226612119, "ground_truth": 0}, {"key": "30844962", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.45326185301647787, "ground_truth": 0}, {"key": "36217333", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6187804396045888, "ground_truth": 0}, {"key": "36217333", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6132365468242774, "ground_truth": 0}, {"key": "36217333", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7185943615494744, "ground_truth": 0}, {"key": "36217333", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581462403136, "ground_truth": 0}, {"key": "36217333", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850300416325, "ground_truth": 0}, {"key": "30816523", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228214322427, "ground_truth": 0}, {"key": "30816523", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7563575732823642, "ground_truth": 0}, {"key": "30816523", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7981867837952157, "ground_truth": 0}, {"key": "30816523", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256049483292, "ground_truth": 0}, {"key": "30816523", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307382688838, "ground_truth": 0}, {"key": "38900884", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8864204152813406, "ground_truth": 0}, {"key": "38900884", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9161096098064055, "ground_truth": 0}, {"key": "38900884", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9105453968989411, "ground_truth": 0}, {"key": "38900884", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9161096181431878, "ground_truth": 0}, {"key": "38900884", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8661325116305424, "ground_truth": 0}, {"key": "13890581", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9073122260385753, "ground_truth": 0}, {"key": "13890581", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619292035457, "ground_truth": 0}, {"key": "13890581", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8187368093429848, "ground_truth": 0}, {"key": "13890581", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.848972198611282, "ground_truth": 0}, {"key": "13890581", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441162216588, "ground_truth": 0}, {"key": "40194700", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7956581013915806, "ground_truth": 0}, {"key": "40194700", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8529354857634778, "ground_truth": 0}, {"key": "40194700", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8233284027298867, "ground_truth": 0}, {"key": "40194700", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619349438888, "ground_truth": 0}, {"key": "40194700", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8976952890448343, "ground_truth": 0}, {"key": "37903647", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5964331399830121, "ground_truth": 0}, {"key": "37903647", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.804405925702159, "ground_truth": 0}, {"key": "37903647", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7295197866978957, "ground_truth": 0}, {"key": "37903647", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303329105695, "ground_truth": 0}, {"key": "37903647", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647896021097, "ground_truth": 0}, {"key": "13291223", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6388352632581796, "ground_truth": 0}, {"key": "13291223", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7386690880565632, "ground_truth": 0}, {"key": "13291223", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6706082881990633, "ground_truth": 0}, {"key": "13291223", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701239647373, "ground_truth": 0}, {"key": "13291223", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891337510464, "ground_truth": 0}, {"key": "36052570", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6442251086721744, "ground_truth": 0}, {"key": "36052570", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8175744735858538, "ground_truth": 0}, {"key": "36052570", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6976089102178512, "ground_truth": 0}, {"key": "36052570", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953661986956, "ground_truth": 0}, {"key": "36052570", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370308192083598, "ground_truth": 0}, {"key": "34944735", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6688802545471523, "ground_truth": 0}, {"key": "34944735", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8714748733676281, "ground_truth": 0}, {"key": "34944735", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8300437693863987, "ground_truth": 0}, {"key": "34944735", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438950967968857, "ground_truth": 0}, {"key": "34944735", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8783142539832196, "ground_truth": 0}, {"key": "32159602", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6242935135259451, "ground_truth": 0}, {"key": "32159602", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7676898520671008, "ground_truth": 0}, {"key": "32159602", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5467381401077224, "ground_truth": 0}, {"key": "32159602", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.740174343150369, "ground_truth": 0}, {"key": "32159602", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916170608896, "ground_truth": 0}, {"key": "34988915", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7138307513772152, "ground_truth": 0}, {"key": "34988915", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7905303078848643, "ground_truth": 0}, {"key": "34988915", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7201714886515511, "ground_truth": 0}, {"key": "34988915", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585592114144, "ground_truth": 0}, {"key": "34988915", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918343266045, "ground_truth": 0}, {"key": "37889203", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7799929121369735, "ground_truth": 0}, {"key": "37889203", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9230391632199748, "ground_truth": 0}, {"key": "37889203", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8529354912517683, "ground_truth": 0}, {"key": "37889203", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204031461816, "ground_truth": 0}, {"key": "37889203", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343727429003, "ground_truth": 0}, {"key": "33609927", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8539127454729581, "ground_truth": 0}, {"key": "33609927", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8577681150624069, "ground_truth": 0}, {"key": "33609927", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.836554566279469, "ground_truth": 0}, {"key": "33609927", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879311874486252, "ground_truth": 0}, {"key": "33609927", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760086074831, "ground_truth": 0}, {"key": "33578778", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.675764600325108, "ground_truth": 0}, {"key": "33578778", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8333245906982861, "ground_truth": 0}, {"key": "33578778", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8255897378107956, "ground_truth": 0}, {"key": "33578778", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.764891617658238, "ground_truth": 0}, {"key": "33578778", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.774583397825558, "ground_truth": 0}, {"key": "36888270", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9066531275027925, "ground_truth": 0}, {"key": "36888270", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7264256127964246, "ground_truth": 0}, {"key": "36888270", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8056321815552556, "ground_truth": 0}, {"key": "36888270", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.816406381959971, "ground_truth": 0}, {"key": "36888270", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640119405909, "ground_truth": 0}, {"key": "36846007", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9775429450382818, "ground_truth": 0}, {"key": "36846007", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9658995755320449, "ground_truth": 0}, {"key": "36846007", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9651191152722408, "ground_truth": 0}, {"key": "36846007", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9618217261584059, "ground_truth": 0}, {"key": "36846007", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9462003554431374, "ground_truth": 0}, {"key": "31723471", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7233094824692, "ground_truth": 0}, {"key": "31723471", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7969253675928344, "ground_truth": 0}, {"key": "31723471", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5679365974366124, "ground_truth": 0}, {"key": "31723471", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.699254409276907, "ground_truth": 0}, {"key": "31723471", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.783988463252277, "ground_truth": 0}, {"key": "15921828", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7057850393335768, "ground_truth": 0}, {"key": "15921828", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6808786193869781, "ground_truth": 0}, {"key": "15921828", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6943026869068064, "ground_truth": 0}, {"key": "15921828", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093859049503, "ground_truth": 0}, {"key": "15921828", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.66714766490659, "ground_truth": 0}, {"key": "39109408", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6132365926899414, "ground_truth": 0}, {"key": "39109408", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.4941408855388973, "ground_truth": 0}, {"key": "39109408", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7264255911525979, "ground_truth": 0}, {"key": "39109408", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.533154413519074, "ground_truth": 0}, {"key": "39109408", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990490438974, "ground_truth": 0}, {"key": "20936833", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.39420097602739024, "ground_truth": 0}, {"key": "20936833", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5813031038816466, "ground_truth": 0}, {"key": "20936833", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.540923880338497, "ground_truth": 0}, {"key": "20936833", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468656860063, "ground_truth": 0}, {"key": "20936833", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.4960938155386381, "ground_truth": 0}, {"key": "36832879", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7185943922086946, "ground_truth": 0}, {"key": "36832879", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8344068991096169, "ground_truth": 0}, {"key": "36832879", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7662936355543376, "ground_truth": 0}, {"key": "36832879", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336989031155, "ground_truth": 0}, {"key": "36832879", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245910452516, "ground_truth": 0}, {"key": "14958201", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8670357566953948, "ground_truth": 0}, {"key": "14958201", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9142907235892619, "ground_truth": 0}, {"key": "14958201", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8244619341074304, "ground_truth": 0}, {"key": "14958201", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509646991291624, "ground_truth": 0}, {"key": "14958201", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531214845838, "ground_truth": 0}, {"key": "34352262", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.384912143847066, "ground_truth": 0}, {"key": "34352262", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.3106943773189027, "ground_truth": 0}, {"key": "34352262", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.45519861851204557, "ground_truth": 0}, {"key": "34352262", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.43014735684386385, "ground_truth": 0}, {"key": "34352262", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.41679665679376987, "ground_truth": 0}, {"key": "39805395", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.445529549594911, "ground_truth": 0}, {"key": "39805395", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.48242910271805634, "ground_truth": 0}, {"key": "39805395", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6584174982645374, "ground_truth": 0}, {"key": "39805395", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300567916354, "ground_truth": 0}, {"key": "39805395", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640048476121, "ground_truth": 0}, {"key": "34303109", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4416730112729327, "ground_truth": 0}, {"key": "34303109", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5312093764980858, "ground_truth": 0}, {"key": "34303109", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6757645974234928, "ground_truth": 0}, {"key": "34303109", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734972913354, "ground_truth": 0}, {"key": "34303109", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804786751247371, "ground_truth": 0}, {"key": "39939090", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8418256617363272, "ground_truth": 0}, {"key": "39939090", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.801935833659259, "ground_truth": 0}, {"key": "39939090", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7476159557927289, "ground_truth": 0}, {"key": "39939090", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142471771139, "ground_truth": 0}, {"key": "39939090", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240808882694, "ground_truth": 0}, {"key": "29347771", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6688802296932657, "ground_truth": 0}, {"key": "29347771", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7918210776831142, "ground_truth": 0}, {"key": "29347771", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7520125524623003, "ground_truth": 0}, {"key": "29347771", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031738014789833, "ground_truth": 0}, {"key": "29347771", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918121078101, "ground_truth": 0}, {"key": "36783415", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8615382060061564, "ground_truth": 0}, {"key": "36783415", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5813031059944281, "ground_truth": 0}, {"key": "36783415", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8354835311720265, "ground_truth": 0}, {"key": "36783415", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199541067003, "ground_truth": 0}, {"key": "36783415", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850319347115, "ground_truth": 0}, {"key": "37935687", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8068526302448534, "ground_truth": 0}, {"key": "37935687", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8376199773832536, "ground_truth": 0}, {"key": "37935687", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.842863141021408, "ground_truth": 0}, {"key": "37935687", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.930962076190535, "ground_truth": 0}, {"key": "37935687", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9092645085171751, "ground_truth": 0}, {"key": "40260829", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.796925379781053, "ground_truth": 0}, {"key": "40260829", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8643104576088267, "ground_truth": 0}, {"key": "40260829", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.900529780435741, "ground_truth": 0}, {"key": "40260829", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140528043803419, "ground_truth": 0}, {"key": "40260829", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545531766494, "ground_truth": 0}, {"key": "36478199", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7786493163362888, "ground_truth": 0}, {"key": "36478199", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8539127565511464, "ground_truth": 0}, {"key": "36478199", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7662936339725279, "ground_truth": 0}, {"key": "36478199", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526127348947, "ground_truth": 0}, {"key": "36478199", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846486448697, "ground_truth": 0}, {"key": "34541803", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7969253707422903, "ground_truth": 0}, {"key": "34541803", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8509647007788091, "ground_truth": 0}, {"key": "34541803", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7853085823172684, "ground_truth": 0}, {"key": "34541803", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.876634379447514, "ground_truth": 0}, {"key": "34541803", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240938117284, "ground_truth": 0}, {"key": "35360841", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9092645102364184, "ground_truth": 0}, {"key": "35360841", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8976952966593937, "ground_truth": 0}, {"key": "35360841", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8548846486020938, "ground_truth": 0}, {"key": "35360841", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213693697272, "ground_truth": 0}, {"key": "35360841", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105561849521, "ground_truth": 0}, {"key": "35550407", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7310585907580989, "ground_truth": 0}, {"key": "35550407", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7549149910206214, "ground_truth": 0}, {"key": "35550407", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6740504902843216, "ground_truth": 0}, {"key": "35550407", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754517671813, "ground_truth": 0}, {"key": "35550407", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976088861803555, "ground_truth": 0}, {"key": "37561590", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.700894791196715, "ground_truth": 0}, {"key": "37561590", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.651354848844535, "ground_truth": 0}, {"key": "37561590", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7826624884340337, "ground_truth": 0}, {"key": "37561590", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878520765392, "ground_truth": 0}, {"key": "37561590", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918323129677, "ground_truth": 0}, {"key": "39328843", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8606036018529918, "ground_truth": 0}, {"key": "39328843", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8643104539555712, "ground_truth": 0}, {"key": "39328843", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8856314728622947, "ground_truth": 0}, {"key": "39328843", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032942146461238, "ground_truth": 0}, {"key": "39328843", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8976952975482347, "ground_truth": 0}, {"key": "35389665", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9635062364082723, "ground_truth": 0}, {"key": "35389665", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9690910418360249, "ground_truth": 0}, {"key": "35389665", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9658995742430805, "ground_truth": 0}, {"key": "35389665", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9706877686163944, "ground_truth": 0}, {"key": "35389665", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.971347330577483, "ground_truth": 0}, {"key": "33080187", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7918210752395366, "ground_truth": 0}, {"key": "33080187", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.77321638149621, "ground_truth": 0}, {"key": "33080187", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5506073687866134, "ground_truth": 0}, {"key": "33080187", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321697896784, "ground_truth": 0}, {"key": "33080187", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476575454353, "ground_truth": 0}, {"key": "38636995", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.804405903225228, "ground_truth": 0}, {"key": "38636995", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8354835409779489, "ground_truth": 0}, {"key": "38636995", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8449215237566786, "ground_truth": 0}, {"key": "38636995", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366511528083, "ground_truth": 0}, {"key": "38636995", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767860572966, "ground_truth": 0}, {"key": "18536236", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.79944231025113, "ground_truth": 0}, {"key": "18536236", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.69925444608981, "ground_truth": 0}, {"key": "18536236", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7505527586548012, "ground_truth": 0}, {"key": "18536236", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601199869589, "ground_truth": 0}, {"key": "18536236", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743741892598, "ground_truth": 0}, {"key": "36289151", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7839884519569552, "ground_truth": 0}, {"key": "36289151", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6959583202399299, "ground_truth": 0}, {"key": "36289151", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.692641980091314, "ground_truth": 0}, {"key": "36289151", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.651354863595849, "ground_truth": 0}, {"key": "36289151", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563486288783, "ground_truth": 0}, {"key": "23017045", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8824278537786245, "ground_truth": 0}, {"key": "23017045", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9130583391701621, "ground_truth": 0}, {"key": "23017045", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8947894636216011, "ground_truth": 0}, {"key": "23017045", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377703736168, "ground_truth": 0}, {"key": "23017045", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9155072492966407, "ground_truth": 0}, {"key": "36418082", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6584174963320835, "ground_truth": 0}, {"key": "36418082", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8459424474276126, "ground_truth": 0}, {"key": "36418082", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8164063914114738, "ground_truth": 0}, {"key": "36418082", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163787979215, "ground_truth": 0}, {"key": "36418082", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311994676265, "ground_truth": 0}, {"key": "34396551", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7371581743663175, "ground_truth": 0}, {"key": "34396551", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619418141975, "ground_truth": 0}, {"key": "34396551", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6976089140281823, "ground_truth": 0}, {"key": "34396551", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448013826106227, "ground_truth": 0}, {"key": "34396551", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615942886975, "ground_truth": 0}, {"key": "39720944", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.892562530950386, "ground_truth": 0}, {"key": "39720944", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.936749473093266, "ground_truth": 0}, {"key": "39720944", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9105453972660094, "ground_truth": 0}, {"key": "39720944", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110397461355, "ground_truth": 0}, {"key": "39720944", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.933430808871108, "ground_truth": 0}, {"key": "35884842", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6352224304350408, "ground_truth": 0}, {"key": "35884842", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7490872058829334, "ground_truth": 0}, {"key": "35884842", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6388352860819274, "ground_truth": 0}, {"key": "35884842", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365681024036, "ground_truth": 0}, {"key": "35884842", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791787038915228, "ground_truth": 0}, {"key": "35403375", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6548947562051582, "ground_truth": 0}, {"key": "35403375", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7264256058777543, "ground_truth": 0}, {"key": "35403375", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6859494338543425, "ground_truth": 0}, {"key": "35403375", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389952618545, "ground_truth": 0}, {"key": "35403375", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995908868705, "ground_truth": 0}, {"key": "26341324", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8840392921577407, "ground_truth": 0}, {"key": "26341324", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8984105462768285, "ground_truth": 0}, {"key": "26341324", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8499711824296414, "ground_truth": 0}, {"key": "26341324", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037323695037, "ground_truth": 0}, {"key": "26341324", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185900471395, "ground_truth": 0}, {"key": "19212345", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8606036157390572, "ground_truth": 0}, {"key": "19212345", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8418256419804984, "ground_truth": 0}, {"key": "19212345", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8596637464586031, "ground_truth": 0}, {"key": "19212345", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325050245245, "ground_truth": 0}, {"key": "19212345", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9304582581586505, "ground_truth": 0}, {"key": "30548367", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7732163637222244, "ground_truth": 0}, {"key": "30548367", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8688267731851648, "ground_truth": 0}, {"key": "30548367", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8187367989163156, "ground_truth": 0}, {"key": "30548367", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105497951818, "ground_truth": 0}, {"key": "30548367", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767994199266, "ground_truth": 0}, {"key": "37919402", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9111797152126832, "ground_truth": 0}, {"key": "37919402", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.924687693058358, "ground_truth": 0}, {"key": "37919402", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9099070123752366, "ground_truth": 0}, {"key": "37919402", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.928926336757027, "ground_truth": 0}, {"key": "37919402", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.928408801994929, "ground_truth": 0}, {"key": "39995133", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8864204065060265, "ground_truth": 0}, {"key": "39995133", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8187367886026161, "ground_truth": 0}, {"key": "39995133", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9235923237560811, "ground_truth": 0}, {"key": "39995133", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473821280558, "ground_truth": 0}, {"key": "39995133", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789207259939, "ground_truth": 0}, {"key": "40249088", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6315943037840537, "ground_truth": 0}, {"key": "40249088", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8289388254442072, "ground_truth": 0}, {"key": "40249088", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7606506606239674, "ground_truth": 0}, {"key": "40249088", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.74613899601595, "ground_truth": 0}, {"key": "40249088", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118759604136, "ground_truth": 0}, {"key": "40254388", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7461389813586988, "ground_truth": 0}, {"key": "40254388", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8233283900991866, "ground_truth": 0}, {"key": "40254388", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7549149925265494, "ground_truth": 0}, {"key": "40254388", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281502270686, "ground_truth": 0}, {"key": "40254388", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367928275734, "ground_truth": 0}, {"key": "31995230", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.896251369545542, "ground_truth": 0}, {"key": "31995230", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8333245775905292, "ground_truth": 0}, {"key": "31995230", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8643104555980069, "ground_truth": 0}, {"key": "31995230", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240724527218, "ground_truth": 0}, {"key": "31995230", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086179017149224, "ground_truth": 0}, {"key": "38632129", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9664104913828959, "ground_truth": 0}, {"key": "38632129", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9686195697437349, "ground_truth": 0}, {"key": "38632129", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9766692317018086, "ground_truth": 0}, {"key": "38632129", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9492946338593634, "ground_truth": 0}, {"key": "38632129", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9671630443399343, "ground_truth": 0}, {"key": "35720795", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8469578339579843, "ground_truth": 0}, {"key": "35720795", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.831143049743859, "ground_truth": 0}, {"key": "35720795", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8489721904223074, "ground_truth": 0}, {"key": "35720795", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.892562535697194, "ground_truth": 0}, {"key": "35720795", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.689305645982427, "ground_truth": 0}, {"key": "23906759", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9594592576733442, "ground_truth": 0}, {"key": "23906759", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9136765300722017, "ground_truth": 0}, {"key": "23906759", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9367494755738207, "ground_truth": 0}, {"key": "23906759", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9294404007397054, "ground_truth": 0}, {"key": "23906759", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9429286030446498, "ground_truth": 0}, {"key": "19410108", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7969253674968202, "ground_truth": 0}, {"key": "19410108", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9032942169144271, "ground_truth": 0}, {"key": "19410108", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7592254106753283, "ground_truth": 0}, {"key": "19410108", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740010662293, "ground_truth": 0}, {"key": "19410108", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511417686663, "ground_truth": 0}, {"key": "30745137", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.749087192902561, "ground_truth": 0}, {"key": "30745137", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7676898491120215, "ground_truth": 0}, {"key": "30745137", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8539127423222086, "ground_truth": 0}, {"key": "30745137", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947369809891, "ground_truth": 0}, {"key": "30745137", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916260722738, "ground_truth": 0}, {"key": "26553115", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6774740225721478, "ground_truth": 0}, {"key": "26553115", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7217432202210099, "ground_truth": 0}, {"key": "26553115", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6279512215701448, "ground_truth": 0}, {"key": "26553115", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593495302594, "ground_truth": 0}, {"key": "26553115", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743553238406, "ground_truth": 0}, {"key": "37872311", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.916708076340262, "ground_truth": 0}, {"key": "37872311", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7461389800714714, "ground_truth": 0}, {"key": "37872311", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8244619346086879, "ground_truth": 0}, {"key": "37872311", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392871067955, "ground_truth": 0}, {"key": "37872311", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346228113241, "ground_truth": 0}, {"key": "35553131", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9525741219357194, "ground_truth": 0}, {"key": "35553131", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.916708079297171, "ground_truth": 0}, {"key": "35553131", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7813305974113165, "ground_truth": 0}, {"key": "35553131", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105604926347, "ground_truth": 0}, {"key": "35553131", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377760372573, "ground_truth": 0}, {"key": "39038936", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8152324933199118, "ground_truth": 0}, {"key": "39038936", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7786493183112418, "ground_truth": 0}, {"key": "39038936", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7264256237092463, "ground_truth": 0}, {"key": "39038936", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215302224006, "ground_truth": 0}, {"key": "39038936", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056322001271465, "ground_truth": 0}, {"key": "38735486", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9678992909764476, "ground_truth": 0}, {"key": "38735486", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9695556483232994, "ground_truth": 0}, {"key": "38735486", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9785492720487854, "ground_truth": 0}, {"key": "38735486", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9612438054548779, "ground_truth": 0}, {"key": "38735486", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.977370798662638, "ground_truth": 0}, {"key": "17087845", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7057850296759646, "ground_truth": 0}, {"key": "17087845", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6808786175834649, "ground_truth": 0}, {"key": "17087845", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7446563242479023, "ground_truth": 0}, {"key": "17087845", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228811248625, "ground_truth": 0}, {"key": "17087845", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269108650617, "ground_truth": 0}, {"key": "37443011", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7201715293598997, "ground_truth": 0}, {"key": "37443011", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7853085634675223, "ground_truth": 0}, {"key": "37443011", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7185944060820209, "ground_truth": 0}, {"key": "37443011", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509647126462904, "ground_truth": 0}, {"key": "37443011", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740051044924, "ground_truth": 0}, {"key": "36855749", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8198933379698169, "ground_truth": 0}, {"key": "36855749", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8577681173810594, "ground_truth": 0}, {"key": "36855749", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7718434975167494, "ground_truth": 0}, {"key": "36855749", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581701300642, "ground_truth": 0}, {"key": "36855749", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802450066113, "ground_truth": 0}, {"key": "35613141", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9235923201053355, "ground_truth": 0}, {"key": "35613141", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9118099600421565, "ground_truth": 0}, {"key": "35613141", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8984105488013289, "ground_truth": 0}, {"key": "35613141", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9469902283819741, "ground_truth": 0}, {"key": "35613141", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233284035627042, "ground_truth": 0}, {"key": "39088847", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8624675306483032, "ground_truth": 0}, {"key": "39088847", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5078118821473445, "ground_truth": 0}, {"key": "39088847", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8407825923562073, "ground_truth": 0}, {"key": "39088847", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585463162775, "ground_truth": 0}, {"key": "39088847", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059246905395, "ground_truth": 0}, {"key": "33197277", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7676898508696872, "ground_truth": 0}, {"key": "33197277", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8418256475628739, "ground_truth": 0}, {"key": "33197277", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8499711774245359, "ground_truth": 0}, {"key": "33197277", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253823944049, "ground_truth": 0}, {"key": "33197277", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647134985456, "ground_truth": 0}, {"key": "33815489", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7718434880986207, "ground_truth": 0}, {"key": "33815489", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8152324689867516, "ground_truth": 0}, {"key": "33815489", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7956580924203338, "ground_truth": 0}, {"key": "33815489", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528050189509, "ground_truth": 0}, {"key": "33815489", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.789233687063777, "ground_truth": 0}, {"key": "35862754", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9284088061772285, "ground_truth": 0}, {"key": "35862754", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.902609605197131, "ground_truth": 0}, {"key": "35862754", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.91429071906801, "ground_truth": 0}, {"key": "35862754", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206765060627, "ground_truth": 0}, {"key": "35862754", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122266475432, "ground_truth": 0}, {"key": "36080615", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.651354864121711, "ground_truth": 0}, {"key": "36080615", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6943026572887742, "ground_truth": 0}, {"key": "36080615", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6619228873876752, "ground_truth": 0}, {"key": "36080615", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105703958627, "ground_truth": 0}, {"key": "36080615", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056249750836, "ground_truth": 0}, {"key": "22822742", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7892337072300376, "ground_truth": 0}, {"key": "22822742", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8407826064099967, "ground_truth": 0}, {"key": "22822742", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8947894681385338, "ground_truth": 0}, {"key": "22822742", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545657155937, "ground_truth": 0}, {"key": "22822742", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068741685565, "ground_truth": 0}, {"key": "39747536", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.935346511853577, "ground_truth": 0}, {"key": "39747536", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8519528148588862, "ground_truth": 0}, {"key": "39747536", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8428631539161388, "ground_truth": 0}, {"key": "39747536", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.956308941860711, "ground_truth": 0}, {"key": "39747536", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9507778834892017, "ground_truth": 0}, {"key": "34218396", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.913676521486393, "ground_truth": 0}, {"key": "34218396", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9019206763824598, "ground_truth": 0}, {"key": "34218396", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9184802520120613, "ground_truth": 0}, {"key": "34218396", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772401502234, "ground_truth": 0}, {"key": "34218396", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278666118134, "ground_truth": 0}, {"key": "39150388", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8661325121013065, "ground_truth": 0}, {"key": "39150388", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7905303137921659, "ground_truth": 0}, {"key": "39150388", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7505527724831126, "ground_truth": 0}, {"key": "39150388", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8879840439476897, "ground_truth": 0}, {"key": "39150388", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159323831709, "ground_truth": 0}, {"key": "28765782", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7879311942260605, "ground_truth": 0}, {"key": "28765782", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.849971173615416, "ground_truth": 0}, {"key": "28765782", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8840392839114708, "ground_truth": 0}, {"key": "28765782", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681103345292, "ground_truth": 0}, {"key": "28765782", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215318339502, "ground_truth": 0}, {"key": "35828022", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6706082673310043, "ground_truth": 0}, {"key": "35828022", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7577943740670949, "ground_truth": 0}, {"key": "35828022", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7356416424869981, "ground_truth": 0}, {"key": "35828022", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647993082788, "ground_truth": 0}, {"key": "35828022", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089081889265, "ground_truth": 0}, {"key": "27717735", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7057850341376297, "ground_truth": 0}, {"key": "27717735", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7676898547772913, "ground_truth": 0}, {"key": "27717735", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6460136929028766, "ground_truth": 0}, {"key": "27717735", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506523065747, "ground_truth": 0}, {"key": "27717735", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527705731819, "ground_truth": 0}, {"key": "37977826", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5945512398439219, "ground_truth": 0}, {"key": "37977826", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.581303083806379, "ground_truth": 0}, {"key": "37977826", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.651354859456536, "ground_truth": 0}, {"key": "37977826", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191295661107, "ground_truth": 0}, {"key": "37977826", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.653126928873269, "ground_truth": 0}, {"key": "31768588", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9575961735753434, "ground_truth": 0}, {"key": "31768588", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9235923196757934, "ground_truth": 0}, {"key": "31768588", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9252299550581551, "ground_truth": 0}, {"key": "31768588", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9334308142440693, "ground_truth": 0}, {"key": "31768588", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9196425257853679, "ground_truth": 0}, {"key": "37183351", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5813031110881514, "ground_truth": 0}, {"key": "37183351", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6513548729807361, "ground_truth": 0}, {"key": "37183351", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6548947682243804, "ground_truth": 0}, {"key": "37183351", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251104964071, "ground_truth": 0}, {"key": "37183351", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300585457894, "ground_truth": 0}, {"key": "39622090", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.848972191945267, "ground_truth": 0}, {"key": "39622090", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8128673239504823, "ground_truth": 0}, {"key": "39622090", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8519528097011239, "ground_truth": 0}, {"key": "39622090", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239890049536, "ground_truth": 0}, {"key": "39622090", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215419004995, "ground_truth": 0}, {"key": "39272756", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7185943966894485, "ground_truth": 0}, {"key": "39272756", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6654105679564302, "ground_truth": 0}, {"key": "39272756", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5621765192058717, "ground_truth": 0}, {"key": "39272756", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544344134304, "ground_truth": 0}, {"key": "39272756", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195285163299, "ground_truth": 0}, {"key": "32138822", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7057850178169529, "ground_truth": 0}, {"key": "32138822", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.822189128401492, "ground_truth": 0}, {"key": "32138822", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6909762732173246, "ground_truth": 0}, {"key": "32138822", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140528148325191, "ground_truth": 0}, {"key": "32138822", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666384519336, "ground_truth": 0}, {"key": "31070114", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4551986010581897, "ground_truth": 0}, {"key": "31070114", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.38861801501692445, "ground_truth": 0}, {"key": "31070114", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.37387582478134296, "ground_truth": 0}, {"key": "31070114", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990500200342, "ground_truth": 0}, {"key": "31070114", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.48438006410416773, "ground_truth": 0}, {"key": "39652762", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9294404046614478, "ground_truth": 0}, {"key": "39652762", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.939913352922203, "ground_truth": 0}, {"key": "39652762", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.907312224314323, "ground_truth": 0}, {"key": "39652762", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9385759604274858, "ground_truth": 0}, {"key": "39652762", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297924817478, "ground_truth": 0}, {"key": "33258866", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7606506647710921, "ground_truth": 0}, {"key": "33258866", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.746138996384211, "ground_truth": 0}, {"key": "33258866", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7138307709779181, "ground_truth": 0}, {"key": "33258866", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584175096432854, "ground_truth": 0}, {"key": "33258866", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.69430265504076, "ground_truth": 0}, {"key": "36962388", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6584175140796924, "ground_truth": 0}, {"key": "36962388", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6959583529723414, "ground_truth": 0}, {"key": "36962388", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7341195097090606, "ground_truth": 0}, {"key": "36962388", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216368406376, "ground_truth": 0}, {"key": "36962388", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918254416453, "ground_truth": 0}, {"key": "32282272", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4804786853500807, "ground_truth": 0}, {"key": "32282272", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.44552954485196805, "ground_truth": 0}, {"key": "32282272", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6808786239408874, "ground_truth": 0}, {"key": "32282272", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.45713672468359984, "ground_truth": 0}, {"key": "32282272", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953612370806, "ground_truth": 0}, {"key": "36093072", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8872045947548038, "ground_truth": 0}, {"key": "36093072", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8175744913790246, "ground_truth": 0}, {"key": "36093072", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9149009502740015, "ground_truth": 0}, {"key": "36093072", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256536438039, "ground_truth": 0}, {"key": "36093072", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891368198098, "ground_truth": 0}, {"key": "38879972", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8376199560520983, "ground_truth": 0}, {"key": "38879972", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7839884733423381, "ground_truth": 0}, {"key": "38879972", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148210557599, "ground_truth": 0}, {"key": "38879972", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430479116819, "ground_truth": 0}, {"key": "38879972", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407826007622983, "ground_truth": 0}, {"key": "32106473", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8856314726206808, "ground_truth": 0}, {"key": "32106473", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9235923159542957, "ground_truth": 0}, {"key": "32106473", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8774767741355329, "ground_truth": 0}, {"key": "32106473", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9268352755114407, "ground_truth": 0}, {"key": "32106473", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.917893377617495, "ground_truth": 0}, {"key": "40415815", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6388352967500056, "ground_truth": 0}, {"key": "40415815", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.613236567263093, "ground_truth": 0}, {"key": "40415815", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.554470478974163, "ground_truth": 0}, {"key": "40415815", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786181911604, "ground_truth": 0}, {"key": "40415815", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792192696688, "ground_truth": 0}, {"key": "34581918", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.735641622652006, "ground_truth": 0}, {"key": "34581918", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8198933268926692, "ground_truth": 0}, {"key": "34581918", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7918210775976527, "ground_truth": 0}, {"key": "34581918", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916057150735, "ground_truth": 0}, {"key": "34581918", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240904392066, "ground_truth": 0}, {"key": "33004157", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8438950978094991, "ground_truth": 0}, {"key": "33004157", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8333245936121227, "ground_truth": 0}, {"key": "33004157", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.833324604548314, "ground_truth": 0}, {"key": "33004157", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.863391609293324, "ground_truth": 0}, {"key": "33004157", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933316543147, "ground_truth": 0}, {"key": "30334943", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9563089352341065, "ground_truth": 0}, {"key": "30334943", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9343951643259417, "ground_truth": 0}, {"key": "30334943", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9026095980796526, "ground_truth": 0}, {"key": "30334943", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9284087975150882, "ground_truth": 0}, {"key": "30334943", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907153378695, "ground_truth": 0}, {"key": "33280503", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6671476553355151, "ground_truth": 0}, {"key": "33280503", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7918210708115427, "ground_truth": 0}, {"key": "33280503", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6909762883974617, "ground_truth": 0}, {"key": "33280503", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321925201957, "ground_truth": 0}, {"key": "33280503", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646036766305, "ground_truth": 0}, {"key": "25726782", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9532750444008188, "ground_truth": 0}, {"key": "25726782", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8962513793413186, "ground_truth": 0}, {"key": "25726782", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9390248190202447, "ground_truth": 0}, {"key": "25726782", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9603611604384351, "ground_truth": 0}, {"key": "25726782", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9469902273053658, "ground_truth": 0}, {"key": "35479854", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7732163868111966, "ground_truth": 0}, {"key": "35479854", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.806852634740007, "ground_truth": 0}, {"key": "35479854", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8006920174744029, "ground_truth": 0}, {"key": "35479854", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672110250753, "ground_truth": 0}, {"key": "35479854", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772392027306, "ground_truth": 0}, {"key": "32716226", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673127693641, "ground_truth": 0}, {"key": "32716226", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7969253809701488, "ground_truth": 0}, {"key": "32716226", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8140528020635558, "ground_truth": 0}, {"key": "32716226", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754642557897, "ground_truth": 0}, {"key": "32716226", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759770041624, "ground_truth": 0}, {"key": "37047554", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7520125541506593, "ground_truth": 0}, {"key": "37047554", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.70089480793867, "ground_truth": 0}, {"key": "37047554", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8210441036222674, "ground_truth": 0}, {"key": "37047554", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990432415262, "ground_truth": 0}, {"key": "37047554", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195140201492, "ground_truth": 0}, {"key": "36565290", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8705972699985359, "ground_truth": 0}, {"key": "36565290", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545636555783, "ground_truth": 0}, {"key": "36565290", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8152324885482263, "ground_truth": 0}, {"key": "36565290", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206800765113, "ground_truth": 0}, {"key": "36565290", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204055207121, "ground_truth": 0}, {"key": "27758640", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8969755790212672, "ground_truth": 0}, {"key": "27758640", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7248702572728684, "ground_truth": 0}, {"key": "27758640", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8558511461113126, "ground_truth": 0}, {"key": "27758640", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711733825537, "ground_truth": 0}, {"key": "27758640", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.74465634266251, "ground_truth": 0}, {"key": "28897118", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9086178948727723, "ground_truth": 0}, {"key": "28897118", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267118092040195, "ground_truth": 0}, {"key": "28897118", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8856314762271236, "ground_truth": 0}, {"key": "28897118", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677468081228, "ground_truth": 0}, {"key": "28897118", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765208995049, "ground_truth": 0}, {"key": "38452661", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9149009494331488, "ground_truth": 0}, {"key": "38452661", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8969755838065125, "ground_truth": 0}, {"key": "38452661", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8333245966293111, "ground_truth": 0}, {"key": "38452661", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891468926411, "ground_truth": 0}, {"key": "38452661", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879312077380689, "ground_truth": 0}, {"key": "38033492", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7371581799783763, "ground_truth": 0}, {"key": "38033492", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7676898638586156, "ground_truth": 0}, {"key": "38033492", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7310585486875081, "ground_truth": 0}, {"key": "38033492", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760347401758, "ground_truth": 0}, {"key": "38033492", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585918007316, "ground_truth": 0}, {"key": "35949555", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9585377241952827, "ground_truth": 0}, {"key": "35949555", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9726235114326561, "ground_truth": 0}, {"key": "35949555", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9358173529188288, "ground_truth": 0}, {"key": "35949555", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9645892708165821, "ground_truth": 0}, {"key": "35949555", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9600626885907834, "ground_truth": 0}, {"key": "15263826", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8539127532944922, "ground_truth": 0}, {"key": "15263826", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7041601436202568, "ground_truth": 0}, {"key": "15263826", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.893309401117312, "ground_truth": 0}, {"key": "15263826", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434958164475, "ground_truth": 0}, {"key": "15263826", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354645300675, "ground_truth": 0}, {"key": "37313866", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8164063766941794, "ground_truth": 0}, {"key": "37313866", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5195213491545061, "ground_truth": 0}, {"key": "37313866", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7634837624906525, "ground_truth": 0}, {"key": "37313866", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789086600285, "ground_truth": 0}, {"key": "37313866", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175220357645, "ground_truth": 0}, {"key": "13911157", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8791467725051821, "ground_truth": 0}, {"key": "13911157", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9149009634548964, "ground_truth": 0}, {"key": "13911157", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8864204069378121, "ground_truth": 0}, {"key": "13911157", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036190101902, "ground_truth": 0}, {"key": "13911157", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907236910377, "ground_truth": 0}, {"key": "39594894", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.665410565328817, "ground_truth": 0}, {"key": "39594894", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431679936066686, "ground_truth": 0}, {"key": "39594894", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6442251014119162, "ground_truth": 0}, {"key": "39594894", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241495671241, "ground_truth": 0}, {"key": "39594894", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.775944543927965, "ground_truth": 0}, {"key": "34096170", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.895522672409813, "ground_truth": 0}, {"key": "34096170", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7772998501120506, "ground_truth": 0}, {"key": "34096170", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8092759517719125, "ground_truth": 0}, {"key": "34096170", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897236593548, "ground_truth": 0}, {"key": "34096170", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303145056599, "ground_truth": 0}, {"key": "37891952", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9563089415658519, "ground_truth": 0}, {"key": "37891952", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9697854117402338, "ground_truth": 0}, {"key": "37891952", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9734434270641732, "ground_truth": 0}, {"key": "37891952", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9704646626143533, "ground_truth": 0}, {"key": "37891952", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9304582605360805, "ground_truth": 0}, {"key": "40186158", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8991213789935203, "ground_truth": 0}, {"key": "40186158", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.705785030487542, "ground_truth": 0}, {"key": "40186158", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8322366568335744, "ground_truth": 0}, {"key": "40186158", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321853167355, "ground_truth": 0}, {"key": "40186158", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306278295218, "ground_truth": 0}, {"key": "37049719", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6706082973579504, "ground_truth": 0}, {"key": "37049719", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8386797575009859, "ground_truth": 0}, {"key": "37049719", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8933094005420815, "ground_truth": 0}, {"key": "37049719", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228324438568, "ground_truth": 0}, {"key": "37049719", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506634473971, "ground_truth": 0}, {"key": "34610504", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9376689573749838, "ground_truth": 0}, {"key": "34610504", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8397339550333687, "ground_truth": 0}, {"key": "34610504", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8198933421493981, "ground_truth": 0}, {"key": "34610504", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213766192193, "ground_truth": 0}, {"key": "34610504", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303207817178, "ground_truth": 0}, {"key": "37595429", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8221891246899234, "ground_truth": 0}, {"key": "37595429", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8300437683074877, "ground_truth": 0}, {"key": "37595429", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8365545576134293, "ground_truth": 0}, {"key": "37595429", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677632905135, "ground_truth": 0}, {"key": "37595429", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105608209187, "ground_truth": 0}, {"key": "29772670", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5448013962202195, "ground_truth": 0}, {"key": "29772670", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.702530039606356, "ground_truth": 0}, {"key": "29772670", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8152324924339965, "ground_truth": 0}, {"key": "29772670", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256154313781, "ground_truth": 0}, {"key": "29772670", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791787013497576, "ground_truth": 0}, {"key": "36369872", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7534666516696792, "ground_truth": 0}, {"key": "36369872", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6132365201188048, "ground_truth": 0}, {"key": "36369872", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.566018537485514, "ground_truth": 0}, {"key": "36369872", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434966310744, "ground_truth": 0}, {"key": "36369872", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916149488666, "ground_truth": 0}, {"key": "34527433", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5370413825647198, "ground_truth": 0}, {"key": "34527433", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5869964335985869, "ground_truth": 0}, {"key": "34527433", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6619228691397527, "ground_truth": 0}, {"key": "34527433", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241413860861, "ground_truth": 0}, {"key": "34527433", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.41300355531051375, "ground_truth": 0}, {"key": "31111734", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8848377724076381, "ground_truth": 0}, {"key": "31111734", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8774767870452732, "ground_truth": 0}, {"key": "31111734", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8539127703773909, "ground_truth": 0}, {"key": "31111734", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185914485227, "ground_truth": 0}, {"key": "31111734", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872045962527816, "ground_truth": 0}, {"key": "40303872", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6370307944073171, "ground_truth": 0}, {"key": "40303872", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7786492806164875, "ground_truth": 0}, {"key": "40303872", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7154239727933758, "ground_truth": 0}, {"key": "40303872", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593643609603, "ground_truth": 0}, {"key": "40303872", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804485934237, "ground_truth": 0}, {"key": "33653553", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7106282992553727, "ground_truth": 0}, {"key": "33653553", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8152324884639153, "ground_truth": 0}, {"key": "33653553", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.620621584116577, "ground_truth": 0}, {"key": "33653553", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331364737684, "ground_truth": 0}, {"key": "33653553", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506751505052, "ground_truth": 0}, {"key": "34404510", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8438951229194053, "ground_truth": 0}, {"key": "34404510", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7918210725186964, "ground_truth": 0}, {"key": "34404510", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.727975434848777, "ground_truth": 0}, {"key": "34404510", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068920625332, "ground_truth": 0}, {"key": "34404510", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432047153618, "ground_truth": 0}, {"key": "35568692", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6020616096979718, "ground_truth": 0}, {"key": "35568692", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5097643612954074, "ground_truth": 0}, {"key": "35568692", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6315943163940143, "ground_truth": 0}, {"key": "35568692", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850248221688, "ground_truth": 0}, {"key": "35568692", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020616118509106, "ground_truth": 0}, {"key": "39151664", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7772998478665408, "ground_truth": 0}, {"key": "39151664", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6495786289534303, "ground_truth": 0}, {"key": "39151664", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7505527609937, "ground_truth": 0}, {"key": "39151664", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935506827031, "ground_truth": 0}, {"key": "39151664", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279511989964015, "ground_truth": 0}, {"key": "37493670", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9928231178711572, "ground_truth": 0}, {"key": "37493670", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9952448001901325, "ground_truth": 0}, {"key": "37493670", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9937587404164036, "ground_truth": 0}, {"key": "37493670", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9946981050151594, "ground_truth": 0}, {"key": "37493670", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.991422515033, "ground_truth": 0}, {"key": "21935983", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6706082811390781, "ground_truth": 0}, {"key": "21935983", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7371581575564855, "ground_truth": 0}, {"key": "21935983", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7826624814795565, "ground_truth": 0}, {"key": "21935983", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.638835257682004, "ground_truth": 0}, {"key": "21935983", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526456768365, "ground_truth": 0}, {"key": "38174214", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8895288534759869, "ground_truth": 0}, {"key": "38174214", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8976953037160761, "ground_truth": 0}, {"key": "38174214", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9367494808133506, "ground_truth": 0}, {"key": "38174214", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9556514194471696, "ground_truth": 0}, {"key": "38174214", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9353465124377536, "ground_truth": 0}, {"key": "40319923", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9600626831394979, "ground_truth": 0}, {"key": "40319923", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9441768570555185, "ground_truth": 0}, {"key": "40319923", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8933093997489715, "ground_truth": 0}, {"key": "40319923", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346268533571, "ground_truth": 0}, {"key": "40319923", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418157437439, "ground_truth": 0}, {"key": "36478264", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8783142480274306, "ground_truth": 0}, {"key": "36478264", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8832359922093894, "ground_truth": 0}, {"key": "36478264", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.881614911943696, "ground_truth": 0}, {"key": "36478264", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9278878054279659, "ground_truth": 0}, {"key": "36478264", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377654575377, "ground_truth": 0}, {"key": "11935769", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7732163754434935, "ground_truth": 0}, {"key": "11935769", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7233094586985517, "ground_truth": 0}, {"key": "11935769", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7138307685782802, "ground_truth": 0}, {"key": "11935769", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461390014820838, "ground_truth": 0}, {"key": "11935769", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601352462019, "ground_truth": 0}, {"key": "33373410", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.65489471872101, "ground_truth": 0}, {"key": "33373410", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5813031002885332, "ground_truth": 0}, {"key": "33373410", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.665410559346997, "ground_truth": 0}, {"key": "33373410", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819690029375, "ground_truth": 0}, {"key": "33373410", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011592726716, "ground_truth": 0}, {"key": "11130680", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8740772392173484, "ground_truth": 0}, {"key": "11130680", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8969755701532662, "ground_truth": 0}, {"key": "11130680", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7592254053360332, "ground_truth": 0}, {"key": "11130680", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127639184528, "ground_truth": 0}, {"key": "11130680", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9026095992378216, "ground_truth": 0}, {"key": "34868650", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6808786022107106, "ground_truth": 0}, {"key": "34868650", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5983121867141294, "ground_truth": 0}, {"key": "34868650", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7905303040305034, "ground_truth": 0}, {"key": "34868650", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434925462822, "ground_truth": 0}, {"key": "34868650", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197822632782, "ground_truth": 0}, {"key": "33960561", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8783142481441669, "ground_truth": 0}, {"key": "33960561", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7446563535778637, "ground_truth": 0}, {"key": "33960561", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8104789039979912, "ground_truth": 0}, {"key": "33960561", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675318829637, "ground_truth": 0}, {"key": "33960561", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972663562397, "ground_truth": 0}, {"key": "22504858", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8848377672647237, "ground_truth": 0}, {"key": "22504858", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8783142417727411, "ground_truth": 0}, {"key": "22504858", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8633916047780117, "ground_truth": 0}, {"key": "22504858", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9213576189952534, "ground_truth": 0}, {"key": "22504858", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675324830552, "ground_truth": 0}, {"key": "32283530", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.77864931387371, "ground_truth": 0}, {"key": "32283530", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6334102639792154, "ground_truth": 0}, {"key": "32283530", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.774583362454652, "ground_truth": 0}, {"key": "32283530", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998972778608, "ground_truth": 0}, {"key": "32283530", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920229386256, "ground_truth": 0}, {"key": "38377099", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.874934611751961, "ground_truth": 0}, {"key": "38377099", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8902942169773703, "ground_truth": 0}, {"key": "38377099", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7981867724349586, "ground_truth": 0}, {"key": "38377099", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825889010706, "ground_truth": 0}, {"key": "38377099", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9079671346721339, "ground_truth": 0}, {"key": "36105123", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9433475707186341, "ground_truth": 0}, {"key": "36105123", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9666631763220797, "ground_truth": 0}, {"key": "36105123", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9702399037779004, "ground_truth": 0}, {"key": "36105123", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.957912275495962, "ground_truth": 0}, {"key": "36105123", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9623913625235291, "ground_truth": 0}, {"key": "33527826", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8289388099273974, "ground_truth": 0}, {"key": "33527826", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8080672196061266, "ground_truth": 0}, {"key": "33527826", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.85195279479889, "ground_truth": 0}, {"key": "33527826", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228522397374, "ground_truth": 0}, {"key": "33527826", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359827999101, "ground_truth": 0}, {"key": "32349891", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.906653115509725, "ground_truth": 0}, {"key": "32349891", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9416541603745807, "ground_truth": 0}, {"key": "32349891", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9376689625448633, "ground_truth": 0}, {"key": "32349891", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067216119194, "ground_truth": 0}, {"key": "32349891", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9202179862675224, "ground_truth": 0}, {"key": "34281974", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7905303153235744, "ground_truth": 0}, {"key": "34281974", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7295197817843374, "ground_truth": 0}, {"key": "34281974", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7606506495834375, "ground_truth": 0}, {"key": "34281974", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256010691935, "ground_truth": 0}, {"key": "34281974", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059357764081, "ground_truth": 0}, {"key": "29387866", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8140528054692471, "ground_truth": 0}, {"key": "29387866", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5467381437572755, "ground_truth": 0}, {"key": "29387866", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7563575354880124, "ground_truth": 0}, {"key": "29387866", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299755535892, "ground_truth": 0}, {"key": "29387866", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786208601303, "ground_truth": 0}, {"key": "35731925", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9873750516704337, "ground_truth": 0}, {"key": "35731925", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9793540682197599, "ground_truth": 0}, {"key": "35731925", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9778834094861864, "ground_truth": 0}, {"key": "35731925", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9891815514837543, "ground_truth": 0}, {"key": "35731925", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.981310692670064, "ground_truth": 0}, {"key": "38829733", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8278281592443119, "ground_truth": 0}, {"key": "38829733", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.822189127828689, "ground_truth": 0}, {"key": "38829733", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8386797652121217, "ground_truth": 0}, {"key": "38829733", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085745025051, "ground_truth": 0}, {"key": "38829733", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759773397957, "ground_truth": 0}, {"key": "24624736", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8267117900517891, "ground_truth": 0}, {"key": "24624736", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8633916060354058, "ground_truth": 0}, {"key": "24624736", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7981867878221152, "ground_truth": 0}, {"key": "24624736", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943930732852, "ground_truth": 0}, {"key": "24624736", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493204715239, "ground_truth": 0}, {"key": "36928562", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.987472067610517, "ground_truth": 0}, {"key": "36928562", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9864678512339308, "ground_truth": 0}, {"key": "36928562", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9796676461852746, "ground_truth": 0}, {"key": "36928562", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9930961616204076, "ground_truth": 0}, {"key": "36928562", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9830850860723416, "ground_truth": 0}, {"key": "34941119", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6943026680056533, "ground_truth": 0}, {"key": "34941119", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7534666532360546, "ground_truth": 0}, {"key": "34941119", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7918210644612923, "ground_truth": 0}, {"key": "34941119", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283990007544, "ground_truth": 0}, {"key": "34941119", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.753466659846707, "ground_truth": 0}, {"key": "30206231", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437561318332, "ground_truth": 0}, {"key": "30206231", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8152324881151853, "ground_truth": 0}, {"key": "30206231", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5813030704037291, "ground_truth": 0}, {"key": "30206231", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358297656441, "ground_truth": 0}, {"key": "30206231", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936563037865, "ground_truth": 0}, {"key": "35584972", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.68930562576329, "ground_truth": 0}, {"key": "35584972", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.73411954243854, "ground_truth": 0}, {"key": "35584972", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.548673503759271, "ground_truth": 0}, {"key": "35584972", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324807482563, "ground_truth": 0}, {"key": "35584972", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563500917991, "ground_truth": 0}, {"key": "39277709", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8244619313525476, "ground_truth": 0}, {"key": "39277709", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8749346233935013, "ground_truth": 0}, {"key": "39277709", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8887587975529392, "ground_truth": 0}, {"key": "39277709", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215149105458, "ground_truth": 0}, {"key": "39277709", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059592480638, "ground_truth": 0}, {"key": "36123657", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9136765212890501, "ground_truth": 0}, {"key": "36123657", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8976952963963528, "ground_truth": 0}, {"key": "36123657", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8925625165934541, "ground_truth": 0}, {"key": "36123657", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837704351736, "ground_truth": 0}, {"key": "36123657", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467669498272, "ground_truth": 0}, {"key": "33363938", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8740772407729831, "ground_truth": 0}, {"key": "33363938", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6424325004841823, "ground_truth": 0}, {"key": "33363938", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8791467646076058, "ground_truth": 0}, {"key": "33363938", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9433475785885639, "ground_truth": 0}, {"key": "33363938", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513693843692, "ground_truth": 0}, {"key": "37349129", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8670357623414617, "ground_truth": 0}, {"key": "37349129", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8840392917386195, "ground_truth": 0}, {"key": "37349129", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9309620773965835, "ground_truth": 0}, {"key": "37349129", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772460717257, "ground_truth": 0}, {"key": "37349129", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.809275977955295, "ground_truth": 0}, {"key": "37160199", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7170118634031504, "ground_truth": 0}, {"key": "37160199", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6619228605889412, "ground_truth": 0}, {"key": "37160199", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5640984713778395, "ground_truth": 0}, {"key": "37160199", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942985373535, "ground_truth": 0}, {"key": "37160199", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6315942864572791, "ground_truth": 0}, {"key": "35891053", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9284088042157856, "ground_truth": 0}, {"key": "35891053", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9196425373555708, "ground_truth": 0}, {"key": "35891053", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9394706123866483, "ground_truth": 0}, {"key": "35891053", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9529258239187839, "ground_truth": 0}, {"key": "35891053", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9329437151315366, "ground_truth": 0}, {"key": "40694542", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9092645063625354, "ground_truth": 0}, {"key": "40694542", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8840392771580062, "ground_truth": 0}, {"key": "40694542", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.909907005367025, "ground_truth": 0}, {"key": "40694542", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9465966732761922, "ground_truth": 0}, {"key": "40694542", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068845584658, "ground_truth": 0}, {"key": "24645770", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.796925372940363, "ground_truth": 0}, {"key": "24645770", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8428631444533785, "ground_truth": 0}, {"key": "24645770", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8407825961133729, "ground_truth": 0}, {"key": "24645770", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.826711797750535, "ground_truth": 0}, {"key": "24645770", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528221915438, "ground_truth": 0}, {"key": "37974587", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8807970738025982, "ground_truth": 0}, {"key": "37974587", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.926303737984798, "ground_truth": 0}, {"key": "37974587", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8652240804188543, "ground_truth": 0}, {"key": "37974587", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.847967763185884, "ground_truth": 0}, {"key": "37974587", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970610084842, "ground_truth": 0}, {"key": "40354149", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9376689587770345, "ground_truth": 0}, {"key": "40354149", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9339146171983492, "ground_truth": 0}, {"key": "40354149", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9669140181441268, "ground_truth": 0}, {"key": "40354149", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9059898269995229, "ground_truth": 0}, {"key": "40354149", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9376689609051881, "ground_truth": 0}, {"key": "35519470", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6909763065440092, "ground_truth": 0}, {"key": "35519470", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6495785879420426, "ground_truth": 0}, {"key": "35519470", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6424324709582374, "ground_truth": 0}, {"key": "35519470", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.540923877356554, "ground_truth": 0}, {"key": "35519470", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548933640496, "ground_truth": 0}, {"key": "36185624", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7248702837150023, "ground_truth": 0}, {"key": "36185624", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7918210591049463, "ground_truth": 0}, {"key": "36185624", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8152324942446476, "ground_truth": 0}, {"key": "36185624", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228300946618, "ground_truth": 0}, {"key": "36185624", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423060230345, "ground_truth": 0}, {"key": "39306113", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.689305633396526, "ground_truth": 0}, {"key": "39306113", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6370308014387173, "ground_truth": 0}, {"key": "39306113", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7606506529361445, "ground_truth": 0}, {"key": "39306113", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916144603372, "ground_truth": 0}, {"key": "39306113", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737637818258, "ground_truth": 0}, {"key": "19347718", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7505527485714913, "ground_truth": 0}, {"key": "19347718", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6548947393794752, "ground_truth": 0}, {"key": "19347718", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6808786349101569, "ground_truth": 0}, {"key": "19347718", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256048387097, "ground_truth": 0}, {"key": "19347718", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321692017043, "ground_truth": 0}, {"key": "21870064", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7416740278870365, "ground_truth": 0}, {"key": "21870064", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6279512145106655, "ground_truth": 0}, {"key": "21870064", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7371581692240686, "ground_truth": 0}, {"key": "21870064", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702625600482, "ground_truth": 0}, {"key": "21870064", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.775944556274108, "ground_truth": 0}, {"key": "37675776", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9053222964016999, "ground_truth": 0}, {"key": "37675776", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.915507248921993, "ground_truth": 0}, {"key": "37675776", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9252299663746919, "ground_truth": 0}, {"key": "37675776", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.92683527215716, "ground_truth": 0}, {"key": "37675776", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.948154534873116, "ground_truth": 0}, {"key": "38107017", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6057990296780654, "ground_truth": 0}, {"key": "38107017", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7676898524152, "ground_truth": 0}, {"key": "38107017", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7295197862577711, "ground_truth": 0}, {"key": "38107017", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197677577099, "ground_truth": 0}, {"key": "38107017", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241430136827, "ground_truth": 0}, {"key": "40046472", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6791787113383732, "ground_truth": 0}, {"key": "40046472", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6150878400885921, "ground_truth": 0}, {"key": "40046472", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7745833920899722, "ground_truth": 0}, {"key": "40046472", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512441575433, "ground_truth": 0}, {"key": "40046472", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737579241644, "ground_truth": 0}, {"key": "32157820", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8606036203354217, "ground_truth": 0}, {"key": "32157820", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8080672148650959, "ground_truth": 0}, {"key": "32157820", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7648916198067125, "ground_truth": 0}, {"key": "32157820", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.851952800930196, "ground_truth": 0}, {"key": "32157820", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434937276806, "ground_truth": 0}, {"key": "41004037", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5525397224981816, "ground_truth": 0}, {"key": "41004037", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6224593412226505, "ground_truth": 0}, {"key": "41004037", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5698526746372115, "ground_truth": 0}, {"key": "41004037", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094605299288, "ground_truth": 0}, {"key": "41004037", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004213777418, "ground_truth": 0}, {"key": "21387993", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6039318330416183, "ground_truth": 0}, {"key": "21387993", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8080672131816142, "ground_truth": 0}, {"key": "21387993", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5717665967192477, "ground_truth": 0}, {"key": "21387993", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228626885412, "ground_truth": 0}, {"key": "21387993", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089210416905, "ground_truth": 0}, {"key": "34665539", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7786493024656448, "ground_truth": 0}, {"key": "34665539", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8092759775144304, "ground_truth": 0}, {"key": "34665539", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6548947235428576, "ground_truth": 0}, {"key": "34665539", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303256113189, "ground_truth": 0}, {"key": "34665539", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690664693651, "ground_truth": 0}, {"key": "37872111", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.644225094087145, "ground_truth": 0}, {"key": "37872111", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6020615725983814, "ground_truth": 0}, {"key": "37872111", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7401743564841141, "ground_truth": 0}, {"key": "37872111", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291022522698, "ground_truth": 0}, {"key": "37872111", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647965290153, "ground_truth": 0}, {"key": "36629542", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8152325116189251, "ground_truth": 0}, {"key": "36629542", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7476159566161469, "ground_truth": 0}, {"key": "36629542", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7799928946265959, "ground_truth": 0}, {"key": "36629542", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224385153376, "ground_truth": 0}, {"key": "36629542", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647820545047, "ground_truth": 0}, {"key": "36487527", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9268352813661936, "ground_truth": 0}, {"key": "36487527", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.4941409063428842, "ground_truth": 0}, {"key": "36487527", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8615382223279882, "ground_truth": 0}, {"key": "36487527", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9246876930699072, "ground_truth": 0}, {"key": "36487527", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9130583495578253, "ground_truth": 0}, {"key": "37344756", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8732148239304645, "ground_truth": 0}, {"key": "37344756", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8947894678325783, "ground_truth": 0}, {"key": "37344756", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9012274122214221, "ground_truth": 0}, {"key": "37344756", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358067207172, "ground_truth": 0}, {"key": "37344756", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424347104871, "ground_truth": 0}, {"key": "38707722", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8068526279146893, "ground_truth": 0}, {"key": "38707722", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7025300485000109, "ground_truth": 0}, {"key": "38707722", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6169358427030677, "ground_truth": 0}, {"key": "38707722", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976088935323197, "ground_truth": 0}, {"key": "38707722", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956581056012068, "ground_truth": 0}, {"key": "37093419", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6671476610013392, "ground_truth": 0}, {"key": "37093419", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.4532618442866157, "ground_truth": 0}, {"key": "37093419", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5926665975020826, "ground_truth": 0}, {"key": "37093419", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.69595830680046, "ground_truth": 0}, {"key": "37093419", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762981549176, "ground_truth": 0}, {"key": "35547391", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9012274085501538, "ground_truth": 0}, {"key": "35547391", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8300437623355008, "ground_truth": 0}, {"key": "35547391", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8879840447041696, "ground_truth": 0}, {"key": "35547391", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068865669398, "ground_truth": 0}, {"key": "35547391", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215422682651, "ground_truth": 0}, {"key": "37173168", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8558511328569186, "ground_truth": 0}, {"key": "37173168", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526347390964, "ground_truth": 0}, {"key": "37173168", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8723473822286324, "ground_truth": 0}, {"key": "37173168", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526087096342, "ground_truth": 0}, {"key": "37173168", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122952864067, "ground_truth": 0}, {"key": "30725298", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7386690788678348, "ground_truth": 0}, {"key": "30725298", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8116760460694273, "ground_truth": 0}, {"key": "30725298", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.833324583390741, "ground_truth": 0}, {"key": "30725298", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892337023447897, "ground_truth": 0}, {"key": "30725298", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300554397194, "ground_truth": 0}, {"key": "33830573", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8799743754858061, "ground_truth": 0}, {"key": "33830573", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7853085821548144, "ground_truth": 0}, {"key": "33830573", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8596637420712204, "ground_truth": 0}, {"key": "33830573", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240873728285, "ground_truth": 0}, {"key": "33830573", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577680993033562, "ground_truth": 0}, {"key": "33415474", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5331543794300218, "ground_truth": 0}, {"key": "33415474", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5039061762032696, "ground_truth": 0}, {"key": "33415474", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.3451052747661677, "ground_truth": 0}, {"key": "33415474", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704778305478, "ground_truth": 0}, {"key": "33415474", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764898208332, "ground_truth": 0}, {"key": "37383994", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.925229959317558, "ground_truth": 0}, {"key": "37383994", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9407897499674316, "ground_truth": 0}, {"key": "37383994", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9343951613684428, "ground_truth": 0}, {"key": "37383994", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9399133561004547, "ground_truth": 0}, {"key": "37383994", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099602168802, "ground_truth": 0}, {"key": "38576819", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.884039290175522, "ground_truth": 0}, {"key": "38576819", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8558511502280559, "ground_truth": 0}, {"key": "38576819", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8799743729132028, "ground_truth": 0}, {"key": "38576819", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032942068171943, "ground_truth": 0}, {"key": "38576819", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.874077226957065, "ground_truth": 0}, {"key": "34500226", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.70740469266083, "ground_truth": 0}, {"key": "34500226", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431680354384168, "ground_truth": 0}, {"key": "34500226", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7648916272674984, "ground_truth": 0}, {"key": "34500226", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909763189541903, "ground_truth": 0}, {"key": "34500226", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336975952988, "ground_truth": 0}, {"key": "39856394", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8210441138236239, "ground_truth": 0}, {"key": "39856394", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8519528050275762, "ground_truth": 0}, {"key": "39856394", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148275856393, "ground_truth": 0}, {"key": "39856394", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744807390523, "ground_truth": 0}, {"key": "39856394", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283838976041, "ground_truth": 0}, {"key": "35499522", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.42632159576246836, "ground_truth": 0}, {"key": "35499522", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5888891415304139, "ground_truth": 0}, {"key": "35499522", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.35577487640183725, "ground_truth": 0}, {"key": "35499522", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.40544872482821565, "ground_truth": 0}, {"key": "35499522", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.47463120177824597, "ground_truth": 0}, {"key": "30157766", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8624675304265967, "ground_truth": 0}, {"key": "30157766", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8428631449797516, "ground_truth": 0}, {"key": "30157766", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8080672036324418, "ground_truth": 0}, {"key": "30157766", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213886753563, "ground_truth": 0}, {"key": "30157766", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300631867827, "ground_truth": 0}, {"key": "40472346", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7943849602755542, "ground_truth": 0}, {"key": "40472346", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7170118966340685, "ground_truth": 0}, {"key": "40472346", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7759445594013583, "ground_truth": 0}, {"key": "40472346", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666619224892, "ground_truth": 0}, {"key": "40472346", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059365698787, "ground_truth": 0}, {"key": "35305635", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.822189123969698, "ground_truth": 0}, {"key": "35305635", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619315495558, "ground_truth": 0}, {"key": "35305635", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.840782576587414, "ground_truth": 0}, {"key": "35305635", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970913951613, "ground_truth": 0}, {"key": "35305635", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513784354093, "ground_truth": 0}, {"key": "32495926", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8407825914672385, "ground_truth": 0}, {"key": "32495926", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7905303212670852, "ground_truth": 0}, {"key": "32495926", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8056321783701046, "ground_truth": 0}, {"key": "32495926", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366601661878, "ground_truth": 0}, {"key": "32495926", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744803409981, "ground_truth": 0}, {"key": "37353801", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7310585495613178, "ground_truth": 0}, {"key": "37353801", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6297745944813864, "ground_truth": 0}, {"key": "37353801", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.713830760543682, "ground_truth": 0}, {"key": "37353801", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159497649625, "ground_truth": 0}, {"key": "37353801", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281502331571, "ground_truth": 0}, {"key": "30159904", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8519528033190301, "ground_truth": 0}, {"key": "30159904", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.69925443922828, "ground_truth": 0}, {"key": "30159904", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8354835436007823, "ground_truth": 0}, {"key": "30159904", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104509050071, "ground_truth": 0}, {"key": "30159904", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.796925378296775, "ground_truth": 0}, {"key": "33698679", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6584175127448421, "ground_truth": 0}, {"key": "33698679", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7648916232674334, "ground_truth": 0}, {"key": "33698679", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7943849439329257, "ground_truth": 0}, {"key": "33698679", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.699254429121615, "ground_truth": 0}, {"key": "33698679", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549570230196, "ground_truth": 0}, {"key": "40530172", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9661559675284777, "ground_truth": 0}, {"key": "40530172", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8991213674012728, "ground_truth": 0}, {"key": "40530172", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9105454023806169, "ground_truth": 0}, {"key": "40530172", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9149009526779334, "ground_truth": 0}, {"key": "40530172", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9339146258696525, "ground_truth": 0}, {"key": "40652941", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8969755774227396, "ground_truth": 0}, {"key": "40652941", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7745833620701508, "ground_truth": 0}, {"key": "40652941", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8799743740731975, "ground_truth": 0}, {"key": "40652941", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.906653116055469, "ground_truth": 0}, {"key": "40652941", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.849971183307011, "ground_truth": 0}, {"key": "40122246", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9449947043784147, "ground_truth": 0}, {"key": "40122246", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8568123055834506, "ground_truth": 0}, {"key": "40122246", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.841825652150247, "ground_truth": 0}, {"key": "40122246", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228402636671, "ground_truth": 0}, {"key": "40122246", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631422120904, "ground_truth": 0}, {"key": "40032656", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8991213789150121, "ground_truth": 0}, {"key": "40032656", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8311430425674255, "ground_truth": 0}, {"key": "40032656", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7943849608257277, "ground_truth": 0}, {"key": "40032656", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509647101705836, "ground_truth": 0}, {"key": "40032656", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218411741749, "ground_truth": 0}, {"key": "38913680", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6113819836157292, "ground_truth": 0}, {"key": "38913680", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6671477077518125, "ground_truth": 0}, {"key": "38913680", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6654105827314828, "ground_truth": 0}, {"key": "38913680", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575729853439, "ground_truth": 0}, {"key": "38913680", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105432639883, "ground_truth": 0}, {"key": "17608039", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5156199063909432, "ground_truth": 0}, {"key": "17608039", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6876299956158367, "ground_truth": 0}, {"key": "17608039", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7371581370280544, "ground_truth": 0}, {"key": "17608039", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711585733816, "ground_truth": 0}, {"key": "17608039", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118699706192, "ground_truth": 0}, {"key": "40434901", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8596637556959433, "ground_truth": 0}, {"key": "40434901", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7577943870672101, "ground_truth": 0}, {"key": "40434901", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8407825861242637, "ground_truth": 0}, {"key": "40434901", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9118099497874835, "ground_truth": 0}, {"key": "40434901", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267118017292664, "ground_truth": 0}, {"key": "37680058", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6388352628867838, "ground_truth": 0}, {"key": "37680058", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6842639992285249, "ground_truth": 0}, {"key": "37680058", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7356416452222349, "ground_truth": 0}, {"key": "37680058", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460137063109868, "ground_truth": 0}, {"key": "37680058", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583124337816, "ground_truth": 0}, {"key": "37291821", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8031738024064815, "ground_truth": 0}, {"key": "37291821", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6424324740016785, "ground_truth": 0}, {"key": "37291821", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6477982181777471, "ground_truth": 0}, {"key": "37291821", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786143810467, "ground_truth": 0}, {"key": "37291821", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321859863967, "ground_truth": 0}, {"key": "41002743", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7592253951332465, "ground_truth": 0}, {"key": "41002743", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8548846496934976, "ground_truth": 0}, {"key": "41002743", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8019358364040309, "ground_truth": 0}, {"key": "41002743", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303192437226, "ground_truth": 0}, {"key": "41002743", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358152267569, "ground_truth": 0}, {"key": "36322869", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8679338633930708, "ground_truth": 0}, {"key": "36322869", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8783142445845615, "ground_truth": 0}, {"key": "36322869", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8933094124371551, "ground_truth": 0}, {"key": "36322869", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.908617895959617, "ground_truth": 0}, {"key": "36322869", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970819144061, "ground_truth": 0}, {"key": "39459717", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8969755704091993, "ground_truth": 0}, {"key": "39459717", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9348724472754613, "ground_truth": 0}, {"key": "39459717", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9046505328208848, "ground_truth": 0}, {"key": "39459717", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.873214828151273, "ground_truth": 0}, {"key": "39459717", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846317791368, "ground_truth": 0}, {"key": "36503727", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.677474027527991, "ground_truth": 0}, {"key": "36503727", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5448013758258381, "ground_truth": 0}, {"key": "36503727", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.49218811394876416, "ground_truth": 0}, {"key": "36503727", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872287027158, "ground_truth": 0}, {"key": "36503727", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789050733252, "ground_truth": 0}, {"key": "35682367", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7799928909509288, "ground_truth": 0}, {"key": "35682367", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8895288540952376, "ground_truth": 0}, {"key": "35682367", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6076631912959097, "ground_truth": 0}, {"key": "35682367", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445343234268, "ground_truth": 0}, {"key": "35682367", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056216202957, "ground_truth": 0}, {"key": "36472353", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6976089188310504, "ground_truth": 0}, {"key": "36472353", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8175744752150627, "ground_truth": 0}, {"key": "36472353", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.49218812155786085, "ground_truth": 0}, {"key": "36472353", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953455904942, "ground_truth": 0}, {"key": "36472353", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419954173824, "ground_truth": 0}, {"key": "37651907", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7122321764279274, "ground_truth": 0}, {"key": "37651907", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526220867824, "ground_truth": 0}, {"key": "37651907", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6477982077664458, "ground_truth": 0}, {"key": "37651907", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.830043776998948, "ground_truth": 0}, {"key": "37651907", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389930401717, "ground_truth": 0}, {"key": "36255476", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7041601603980652, "ground_truth": 0}, {"key": "36255476", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5602526344788783, "ground_truth": 0}, {"key": "36255476", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6095241534186153, "ground_truth": 0}, {"key": "36255476", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216071752936, "ground_truth": 0}, {"key": "36255476", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746279027221, "ground_truth": 0}, {"key": "37283518", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9099070136232651, "ground_truth": 0}, {"key": "37283518", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8397339676728387, "ground_truth": 0}, {"key": "37283518", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8278281537515526, "ground_truth": 0}, {"key": "37283518", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281751153664, "ground_truth": 0}, {"key": "37283518", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759748479751, "ground_truth": 0}, {"key": "34906785", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7799928824103365, "ground_truth": 0}, {"key": "34906785", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8661325268860389, "ground_truth": 0}, {"key": "34906785", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7704647937619352, "ground_truth": 0}, {"key": "34906785", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872287184067, "ground_truth": 0}, {"key": "34906785", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089098360949, "ground_truth": 0}, {"key": "34965328", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8479677652505053, "ground_truth": 0}, {"key": "34965328", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8940517135248122, "ground_truth": 0}, {"key": "34965328", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7476159710533994, "ground_truth": 0}, {"key": "34965328", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424439488463, "ground_truth": 0}, {"key": "34965328", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675368223109, "ground_truth": 0}, {"key": "38788440", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5964331438064804, "ground_truth": 0}, {"key": "38788440", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6671476689932545, "ground_truth": 0}, {"key": "38788440", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5717666087783851, "ground_truth": 0}, {"key": "38788440", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850021303561, "ground_truth": 0}, {"key": "38788440", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689515987656, "ground_truth": 0}, {"key": "35046866", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8962513597685845, "ground_truth": 0}, {"key": "35046866", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9066531227534772, "ground_truth": 0}, {"key": "35046866", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8577681150903128, "ground_truth": 0}, {"key": "35046866", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9026096050615955, "ground_truth": 0}, {"key": "35046866", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053222961049024, "ground_truth": 0}, {"key": "37629558", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5583270226174578, "ground_truth": 0}, {"key": "37629558", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431680172410602, "ground_truth": 0}, {"key": "37629558", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6297746263457348, "ground_truth": 0}, {"key": "37629558", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953634939173, "ground_truth": 0}, {"key": "37629558", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102525840568, "ground_truth": 0}, {"key": "33859914", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8397339547108514, "ground_truth": 0}, {"key": "33859914", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8558511439204964, "ground_truth": 0}, {"key": "33859914", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8679338471590861, "ground_truth": 0}, {"key": "33859914", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325148702844, "ground_truth": 0}, {"key": "33859914", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619528621097, "ground_truth": 0}, {"key": "39790523", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8529354926417095, "ground_truth": 0}, {"key": "39790523", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.770464771027611, "ground_truth": 0}, {"key": "39790523", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8976952946514039, "ground_truth": 0}, {"key": "39790523", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191268998121, "ground_truth": 0}, {"key": "39790523", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149109385119, "ground_truth": 0}, {"key": "33509656", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6976088800395849, "ground_truth": 0}, {"key": "33509656", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7918210617341007, "ground_truth": 0}, {"key": "33509656", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.771843489610538, "ground_truth": 0}, {"key": "33509656", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432159412561, "ground_truth": 0}, {"key": "33509656", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548865214275, "ground_truth": 0}, {"key": "17380923", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8587185878431224, "ground_truth": 0}, {"key": "17380923", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8300437666122628, "ground_truth": 0}, {"key": "17380923", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9343951647438004, "ground_truth": 0}, {"key": "17380923", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972796626267, "ground_truth": 0}, {"key": "17380923", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388053297897, "ground_truth": 0}, {"key": "36202526", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7786493153441094, "ground_truth": 0}, {"key": "36202526", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8558511396118009, "ground_truth": 0}, {"key": "36202526", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7853085957585215, "ground_truth": 0}, {"key": "36202526", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837679834684, "ground_truth": 0}, {"key": "36202526", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163598264408, "ground_truth": 0}, {"key": "26419232", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5983121841138428, "ground_truth": 0}, {"key": "26419232", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5755880191118867, "ground_truth": 0}, {"key": "26419232", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6513548675301706, "ground_truth": 0}, {"key": "26419232", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527667538299, "ground_truth": 0}, {"key": "26419232", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737085000142, "ground_truth": 0}, {"key": "34232398", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.737158153591415, "ground_truth": 0}, {"key": "34232398", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9066531217130451, "ground_truth": 0}, {"key": "34232398", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7325918257831151, "ground_truth": 0}, {"key": "34232398", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437818743845, "ground_truth": 0}, {"key": "34232398", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339541247154, "ground_truth": 0}, {"key": "33586045", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.884837777176266, "ground_truth": 0}, {"key": "33586045", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.846957854905952, "ground_truth": 0}, {"key": "33586045", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7325918229145363, "ground_truth": 0}, {"key": "33586045", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672188766853, "ground_truth": 0}, {"key": "33586045", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835444189247, "ground_truth": 0}, {"key": "32281151", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8006920344726888, "ground_truth": 0}, {"key": "32281151", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7154240022913146, "ground_truth": 0}, {"key": "32281151", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8116760110801191, "ground_truth": 0}, {"key": "32281151", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104788923293487, "ground_truth": 0}, {"key": "32281151", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245914691694, "ground_truth": 0}, {"key": "37308159", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.912436159710365, "ground_truth": 0}, {"key": "37308159", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9246876947572971, "ground_truth": 0}, {"key": "37308159", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9241418192875656, "ground_truth": 0}, {"key": "37308159", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923165652757, "ground_truth": 0}, {"key": "37308159", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9124361539690585, "ground_truth": 0}, {"key": "35694408", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8856314816965382, "ground_truth": 0}, {"key": "35694408", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9155072487739264, "ground_truth": 0}, {"key": "35694408", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8311430619377289, "ground_truth": 0}, {"key": "35694408", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195233577454, "ground_truth": 0}, {"key": "35694408", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437832497362, "ground_truth": 0}, {"key": "39781995", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6774740146985481, "ground_truth": 0}, {"key": "39781995", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.661922859849141, "ground_truth": 0}, {"key": "39781995", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7620700925592951, "ground_truth": 0}, {"key": "39781995", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.763483760476763, "ground_truth": 0}, {"key": "39781995", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743648806367, "ground_truth": 0}, {"key": "22799372", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9309620745042692, "ground_truth": 0}, {"key": "22799372", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9518632305010771, "ground_truth": 0}, {"key": "22799372", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9241418117460632, "ground_truth": 0}, {"key": "22799372", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9458012723507914, "ground_truth": 0}, {"key": "22799372", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.964589270568602, "ground_truth": 0}, {"key": "37428240", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6150878612514841, "ground_truth": 0}, {"key": "37428240", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6601723832578912, "ground_truth": 0}, {"key": "37428240", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6740504704748689, "ground_truth": 0}, {"key": "37428240", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201715099886431, "ground_truth": 0}, {"key": "37428240", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666583054619, "ground_truth": 0}, {"key": "40612657", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8887587970638435, "ground_truth": 0}, {"key": "40612657", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9219218297623106, "ground_truth": 0}, {"key": "40612657", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9073122238400511, "ground_truth": 0}, {"key": "40612657", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148287883631, "ground_truth": 0}, {"key": "40612657", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9473810449551657, "ground_truth": 0}, {"key": "34404662", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8376199630122918, "ground_truth": 0}, {"key": "34404662", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8840392813327043, "ground_truth": 0}, {"key": "34404662", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9066531213886437, "ground_truth": 0}, {"key": "34404662", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9066531282167949, "ground_truth": 0}, {"key": "34404662", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104598384268, "ground_truth": 0}, {"key": "32619704", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7446563584500902, "ground_truth": 0}, {"key": "32619704", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6808786283775765, "ground_truth": 0}, {"key": "32619704", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7676898561650798, "ground_truth": 0}, {"key": "32619704", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199701881226, "ground_truth": 0}, {"key": "32619704", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306208719009, "ground_truth": 0}, {"key": "39014883", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6460137104499162, "ground_truth": 0}, {"key": "39014883", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7217432276502717, "ground_truth": 0}, {"key": "39014883", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7759445313668215, "ground_truth": 0}, {"key": "39014883", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256127283796, "ground_truth": 0}, {"key": "39014883", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754508805191, "ground_truth": 0}, {"key": "37982812", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8910549535694067, "ground_truth": 0}, {"key": "37982812", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9626731123460414, "ground_truth": 0}, {"key": "37982812", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9546474177907993, "ground_truth": 0}, {"key": "37982812", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9066531222381985, "ground_truth": 0}, {"key": "37982812", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9458012691791714, "ground_truth": 0}, {"key": "28123476", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9309620745502312, "ground_truth": 0}, {"key": "28123476", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8799743695292767, "ground_truth": 0}, {"key": "28123476", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8757869971424888, "ground_truth": 0}, {"key": "28123476", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278680249985, "ground_truth": 0}, {"key": "28123476", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213786299622, "ground_truth": 0}, {"key": "39078849", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.713830764993259, "ground_truth": 0}, {"key": "39078849", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7217431834026002, "ground_truth": 0}, {"key": "39078849", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8428631417819313, "ground_truth": 0}, {"key": "39078849", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159419540666, "ground_truth": 0}, {"key": "39078849", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044058957105101, "ground_truth": 0}, {"key": "39414137", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9704646622951448, "ground_truth": 0}, {"key": "39414137", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.959459260126379, "ground_truth": 0}, {"key": "39414137", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9719924786821363, "ground_truth": 0}, {"key": "39414137", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9623913662079132, "ground_truth": 0}, {"key": "39414137", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9777138139565924, "ground_truth": 0}, {"key": "37371354", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6388352989545077, "ground_truth": 0}, {"key": "37371354", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.795658098242783, "ground_truth": 0}, {"key": "37371354", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.620621609900839, "ground_truth": 0}, {"key": "37371354", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125796104646, "ground_truth": 0}, {"key": "37371354", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615710925208, "ground_truth": 0}, {"key": "29497179", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8548846371198043, "ground_truth": 0}, {"key": "29497179", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8449215279573483, "ground_truth": 0}, {"key": "29497179", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.859663761533792, "ground_truth": 0}, {"key": "29497179", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346131246197, "ground_truth": 0}, {"key": "29497179", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799929197633307, "ground_truth": 0}, {"key": "35908694", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.931959579306345, "ground_truth": 0}, {"key": "35908694", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9575961688043577, "ground_truth": 0}, {"key": "35908694", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9416541563736032, "ground_truth": 0}, {"key": "35908694", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9420819094313173, "ground_truth": 0}, {"key": "35908694", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9453993872195935, "ground_truth": 0}, {"key": "37619358", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6926419848477159, "ground_truth": 0}, {"key": "37619358", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8732148245093556, "ground_truth": 0}, {"key": "37619358", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8459424346221979, "ground_truth": 0}, {"key": "37619358", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9358173510824904, "ground_truth": 0}, {"key": "37619358", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117798384115, "ground_truth": 0}, {"key": "37293103", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8791467651477627, "ground_truth": 0}, {"key": "37293103", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8864204123913916, "ground_truth": 0}, {"key": "37293103", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8840392824742075, "ground_truth": 0}, {"key": "37293103", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9403530597385007, "ground_truth": 0}, {"key": "37293103", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632867340401, "ground_truth": 0}, {"key": "36883729", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7956580964849804, "ground_truth": 0}, {"key": "36883729", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8019358344890172, "ground_truth": 0}, {"key": "36883729", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.782662490123142, "ground_truth": 0}, {"key": "36883729", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210646295484, "ground_truth": 0}, {"key": "36883729", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647040764783, "ground_truth": 0}, {"key": "39209521", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8489721760752834, "ground_truth": 0}, {"key": "39209521", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8152324864776698, "ground_truth": 0}, {"key": "39209521", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8879840316936075, "ground_truth": 0}, {"key": "39209521", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210654422057, "ground_truth": 0}, {"key": "39209521", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872046019440802, "ground_truth": 0}, {"key": "27792571", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7606506776748034, "ground_truth": 0}, {"key": "27792571", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7786492933949771, "ground_truth": 0}, {"key": "27792571", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6460136987780128, "ground_truth": 0}, {"key": "27792571", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392721516356, "ground_truth": 0}, {"key": "27792571", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118688766363, "ground_truth": 0}, {"key": "39755647", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7233094797280104, "ground_truth": 0}, {"key": "39755647", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8187368134098243, "ground_truth": 0}, {"key": "39755647", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8558511467598549, "ground_truth": 0}, {"key": "39755647", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085954303549, "ground_truth": 0}, {"key": "39755647", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748664686637, "ground_truth": 0}, {"key": "40800537", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6671476788734987, "ground_truth": 0}, {"key": "40800537", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8376199612593705, "ground_truth": 0}, {"key": "40800537", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.44360042527251836, "ground_truth": 0}, {"key": "40800537", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791787077373135, "ground_truth": 0}, {"key": "40800537", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358321746614, "ground_truth": 0}, {"key": "14171461", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5039061822217135, "ground_truth": 0}, {"key": "14171461", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6926419799481188, "ground_truth": 0}, {"key": "14171461", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8255897108573159, "ground_truth": 0}, {"key": "14171461", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.737158188129812, "ground_truth": 0}, {"key": "14171461", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918067577066, "ground_truth": 0}, {"key": "36892440", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.806852612132949, "ground_truth": 0}, {"key": "36892440", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.844921525870594, "ground_truth": 0}, {"key": "36892440", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8832359877193482, "ground_truth": 0}, {"key": "36892440", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277829573, "ground_truth": 0}, {"key": "36892440", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085778965045, "ground_truth": 0}, {"key": "33733410", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.831143049714852, "ground_truth": 0}, {"key": "33733410", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8311430474598319, "ground_truth": 0}, {"key": "33733410", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7799929029628255, "ground_truth": 0}, {"key": "33733410", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802429122546, "ground_truth": 0}, {"key": "33733410", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837684423835, "ground_truth": 0}, {"key": "38587765", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.46101680191916017, "ground_truth": 0}, {"key": "38587765", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.46879064996157954, "ground_truth": 0}, {"key": "38587765", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6406358486787983, "ground_truth": 0}, {"key": "38587765", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.3812195801038409, "ground_truth": 0}, {"key": "38587765", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.43206337962579444, "ground_truth": 0}, {"key": "41065582", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7025300452028065, "ground_truth": 0}, {"key": "41065582", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8019358228871517, "ground_truth": 0}, {"key": "41065582", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6279512041806022, "ground_truth": 0}, {"key": "41065582", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493042106327, "ground_truth": 0}, {"key": "41065582", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163667630613, "ground_truth": 0}, {"key": "34713891", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7446563574868332, "ground_truth": 0}, {"key": "34713891", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6842640104452342, "ground_truth": 0}, {"key": "34713891", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8596637579580376, "ground_truth": 0}, {"key": "34713891", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754362769292, "ground_truth": 0}, {"key": "34713891", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984325037647, "ground_truth": 0}, {"key": "18913023", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867775675331, "ground_truth": 0}, {"key": "18913023", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8757869845719995, "ground_truth": 0}, {"key": "18913023", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8044059217921423, "ground_truth": 0}, {"key": "18913023", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.756357547976144, "ground_truth": 0}, {"key": "18913023", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646938823228, "ground_truth": 0}, {"key": "36884100", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6757646131355924, "ground_truth": 0}, {"key": "36884100", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.729519775074555, "ground_truth": 0}, {"key": "36884100", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6406358721961811, "ground_truth": 0}, {"key": "36884100", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883450858498, "ground_truth": 0}, {"key": "36884100", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.4980468987294431, "ground_truth": 0}, {"key": "39899913", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8210441171847104, "ground_truth": 0}, {"key": "39899913", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7549149944337564, "ground_truth": 0}, {"key": "39899913", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9059898168428006, "ground_truth": 0}, {"key": "39899913", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578387257072, "ground_truth": 0}, {"key": "39899913", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511502237097, "ground_truth": 0}, {"key": "30725366", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6150878433389234, "ground_truth": 0}, {"key": "30725366", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7476159626935345, "ground_truth": 0}, {"key": "30725366", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.616935828235463, "ground_truth": 0}, {"key": "30725366", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593397859215, "ground_truth": 0}, {"key": "30725366", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.638835293441023, "ground_truth": 0}, {"key": "26133523", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7416740250428836, "ground_truth": 0}, {"key": "26133523", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.732591835041488, "ground_truth": 0}, {"key": "26133523", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7233094774157325, "ground_truth": 0}, {"key": "26133523", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953505340432, "ground_truth": 0}, {"key": "26133523", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256080589978, "ground_truth": 0}, {"key": "29332665", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8670357580292449, "ground_truth": 0}, {"key": "29332665", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8732148331990826, "ground_truth": 0}, {"key": "29332665", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7416739974633857, "ground_truth": 0}, {"key": "29332665", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.45713669668321844, "ground_truth": 0}, {"key": "29332665", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185792608167, "ground_truth": 0}, {"key": "37400481", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9407897431690173, "ground_truth": 0}, {"key": "37400481", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.921921831629858, "ground_truth": 0}, {"key": "37400481", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9130583434839773, "ground_truth": 0}, {"key": "37400481", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9012274067412769, "ground_truth": 0}, {"key": "37400481", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8976952852563513, "ground_truth": 0}, {"key": "38787241", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6791786800977598, "ground_truth": 0}, {"key": "38787241", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7620701293385841, "ground_truth": 0}, {"key": "38787241", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8092759834226577, "ground_truth": 0}, {"key": "38787241", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620700977220185, "ground_truth": 0}, {"key": "38787241", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118701042338, "ground_truth": 0}, {"key": "38225963", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7310585858340253, "ground_truth": 0}, {"key": "38225963", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7718435089364221, "ground_truth": 0}, {"key": "38225963", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7520125923301926, "ground_truth": 0}, {"key": "38225963", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358299091319, "ground_truth": 0}, {"key": "38225963", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036166859352, "ground_truth": 0}, {"key": "26072034", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.20434191036337587, "ground_truth": 0}, {"key": "26072034", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.24944722802120228, "ground_truth": 0}, {"key": "26072034", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.39047585718105493, "ground_truth": 0}, {"key": "26072034", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.2553436621067368, "ground_truth": 0}, {"key": "26072034", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.2465333426167548, "ground_truth": 0}, {"key": "35690810", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.704160131388401, "ground_truth": 0}, {"key": "35690810", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8499711768759481, "ground_truth": 0}, {"key": "35690810", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8984105571676472, "ground_truth": 0}, {"key": "35690810", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631572338562, "ground_truth": 0}, {"key": "35690810", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059189468878, "ground_truth": 0}, {"key": "36855665", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9719924809896838, "ground_truth": 0}, {"key": "36855665", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9686195726191742, "ground_truth": 0}, {"key": "36855665", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9603611643947051, "ground_truth": 0}, {"key": "36855665", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9603611595805569, "ground_truth": 0}, {"key": "36855665", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9728307718100482, "ground_truth": 0}, {"key": "29757662", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7341195181425377, "ground_truth": 0}, {"key": "29757662", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545784682459, "ground_truth": 0}, {"key": "29757662", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7446563499701129, "ground_truth": 0}, {"key": "29757662", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321784738617, "ground_truth": 0}, {"key": "29757662", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593313005861, "ground_truth": 0}, {"key": "19134339", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5234203500698507, "ground_truth": 0}, {"key": "19134339", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7592253891258007, "ground_truth": 0}, {"key": "19134339", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5409238749544174, "ground_truth": 0}, {"key": "19134339", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995866204954, "ground_truth": 0}, {"key": "19134339", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.538983233513455, "ground_truth": 0}, {"key": "35360732", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9012274181690452, "ground_truth": 0}, {"key": "35360732", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8615382042445117, "ground_truth": 0}, {"key": "35360732", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9196425308619002, "ground_truth": 0}, {"key": "35360732", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392859934383, "ground_truth": 0}, {"key": "35360732", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578497690728, "ground_truth": 0}, {"key": "37713629", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6057990571724349, "ground_truth": 0}, {"key": "37713629", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8519528051761246, "ground_truth": 0}, {"key": "37713629", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5428632726927317, "ground_truth": 0}, {"key": "37713629", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891530123168, "ground_truth": 0}, {"key": "37713629", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708887413664, "ground_truth": 0}, {"key": "33393394", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8140527953236416, "ground_truth": 0}, {"key": "33393394", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8322366605101752, "ground_truth": 0}, {"key": "33393394", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7813306331028007, "ground_truth": 0}, {"key": "33393394", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094582621358, "ground_truth": 0}, {"key": "33393394", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593191332167, "ground_truth": 0}, {"key": "32275837", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9399133446575915, "ground_truth": 0}, {"key": "32275837", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9241418149837641, "ground_truth": 0}, {"key": "32275837", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8799743814047197, "ground_truth": 0}, {"key": "32275837", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357605087491, "ground_truth": 0}, {"key": "32275837", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8955226755098712, "ground_truth": 0}, {"key": "21458094", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6636689350834747, "ground_truth": 0}, {"key": "21458094", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6370308170250966, "ground_truth": 0}, {"key": "21458094", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7981867742155447, "ground_truth": 0}, {"key": "21458094", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549519940761, "ground_truth": 0}, {"key": "21458094", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476461298552, "ground_truth": 0}, {"key": "40975362", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9339146258239455, "ground_truth": 0}, {"key": "40975362", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9362850034679632, "ground_truth": 0}, {"key": "40975362", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9473810416939343, "ground_truth": 0}, {"key": "40975362", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923224990846, "ground_truth": 0}, {"key": "40975362", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9556514189851549, "ground_truth": 0}, {"key": "35234201", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8933094078191296, "ground_truth": 0}, {"key": "35234201", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9053222998796776, "ground_truth": 0}, {"key": "35234201", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8397339693920991, "ground_truth": 0}, {"key": "35234201", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122846108895, "ground_truth": 0}, {"key": "35234201", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382105110846, "ground_truth": 0}, {"key": "36037573", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8428631484486409, "ground_truth": 0}, {"key": "36037573", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9149009497589253, "ground_truth": 0}, {"key": "36037573", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8418256616027858, "ground_truth": 0}, {"key": "36037573", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392869302455, "ground_truth": 0}, {"key": "36037573", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199728036338, "ground_truth": 0}, {"key": "30861915", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9207896823896639, "ground_truth": 0}, {"key": "30861915", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8872045846346421, "ground_truth": 0}, {"key": "30861915", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.900529793041423, "ground_truth": 0}, {"key": "30861915", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9167080821660161, "ground_truth": 0}, {"key": "30861915", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.925229956633285, "ground_truth": 0}, {"key": "40173012", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6654105562448768, "ground_truth": 0}, {"key": "40173012", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6566582693001229, "ground_truth": 0}, {"key": "40173012", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.770464784997445, "ground_truth": 0}, {"key": "40173012", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512651028365, "ground_truth": 0}, {"key": "40173012", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593532728259, "ground_truth": 0}, {"key": "35100330", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5679366212707968, "ground_truth": 0}, {"key": "35100330", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5583269689517225, "ground_truth": 0}, {"key": "35100330", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6206215926596289, "ground_truth": 0}, {"key": "35100330", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953702376558, "ground_truth": 0}, {"key": "35100330", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174984051462, "ground_truth": 0}, {"key": "37220221", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9224823427045172, "ground_truth": 0}, {"key": "37220221", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9522199368053078, "ground_truth": 0}, {"key": "37220221", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9079671390833252, "ground_truth": 0}, {"key": "37220221", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067226830718, "ground_truth": 0}, {"key": "37220221", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8688267772119097, "ground_truth": 0}, {"key": "38815218", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9511422270621289, "ground_truth": 0}, {"key": "38815218", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9515039964884651, "ground_truth": 0}, {"key": "38815218", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9178933800519041, "ground_truth": 0}, {"key": "38815218", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9343951636240235, "ground_truth": 0}, {"key": "38815218", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9629528296972192, "ground_truth": 0}, {"key": "39379109", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6495786155245707, "ground_truth": 0}, {"key": "39379109", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6671477004317005, "ground_truth": 0}, {"key": "39379109", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7122321839072339, "ground_truth": 0}, {"key": "39379109", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684610433428, "ground_truth": 0}, {"key": "39379109", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381516172352, "ground_truth": 0}, {"key": "14576125", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.3090237066183964, "ground_truth": 0}, {"key": "14576125", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6187804428351067, "ground_truth": 0}, {"key": "14576125", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.2674081332591714, "ground_truth": 0}, {"key": "14576125", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.38306416901838836, "ground_truth": 0}, {"key": "14576125", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.31912139127813394, "ground_truth": 0}, {"key": "40814250", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7416740171340107, "ground_truth": 0}, {"key": "40814250", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7905303188406522, "ground_truth": 0}, {"key": "40814250", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8244619313138553, "ground_truth": 0}, {"key": "40814250", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545651089751, "ground_truth": 0}, {"key": "40814250", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217431989717329, "ground_truth": 0}, {"key": "36334488", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.661922867079613, "ground_truth": 0}, {"key": "36334488", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.573678418046354, "ground_truth": 0}, {"key": "36334488", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7416740191085268, "ground_truth": 0}, {"key": "36334488", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948145651724, "ground_truth": 0}, {"key": "36334488", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.675764611137566, "ground_truth": 0}, {"key": "36888322", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7718435091263443, "ground_truth": 0}, {"key": "36888322", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.880797080207693, "ground_truth": 0}, {"key": "36888322", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8418256434234466, "ground_truth": 0}, {"key": "36888322", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367967331335, "ground_truth": 0}, {"key": "36888322", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.841825650078265, "ground_truth": 0}, {"key": "37318916", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9224823436367106, "ground_truth": 0}, {"key": "37318916", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9462003571201438, "ground_truth": 0}, {"key": "37318916", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9529258194173701, "ground_truth": 0}, {"key": "37318916", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9441768647772255, "ground_truth": 0}, {"key": "37318916", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.92995104082729, "ground_truth": 0}, {"key": "39308700", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5563995762098713, "ground_truth": 0}, {"key": "39308700", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6992544062104682, "ground_truth": 0}, {"key": "39308700", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7648916134484194, "ground_truth": 0}, {"key": "39308700", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033557882116, "ground_truth": 0}, {"key": "39308700", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737274692508, "ground_truth": 0}, {"key": "31061543", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.713830765738862, "ground_truth": 0}, {"key": "31061543", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8872045852976087, "ground_truth": 0}, {"key": "31061543", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8499711675529802, "ground_truth": 0}, {"key": "31061543", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9241418227698028, "ground_truth": 0}, {"key": "31061543", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835481659717, "ground_truth": 0}, {"key": "37380894", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673050283661, "ground_truth": 0}, {"key": "37380894", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8344068961006198, "ground_truth": 0}, {"key": "37380894", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8354835561489415, "ground_truth": 0}, {"key": "37380894", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361682779267, "ground_truth": 0}, {"key": "37380894", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005298041054569, "ground_truth": 0}, {"key": "38410139", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6132365434269597, "ground_truth": 0}, {"key": "38410139", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.670608293815994, "ground_truth": 0}, {"key": "38410139", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8386797690446918, "ground_truth": 0}, {"key": "38410139", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680323250548, "ground_truth": 0}, {"key": "38410139", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359835027369, "ground_truth": 0}, {"key": "35953842", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.684264006841712, "ground_truth": 0}, {"key": "35953842", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9059898172073242, "ground_truth": 0}, {"key": "35953842", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.724870274693503, "ground_truth": 0}, {"key": "35953842", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089368233865, "ground_truth": 0}, {"key": "35953842", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.729519793411606, "ground_truth": 0}, {"key": "39815663", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228292856693, "ground_truth": 0}, {"key": "39815663", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7918210586615774, "ground_truth": 0}, {"key": "39815663", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6842640304103671, "ground_truth": 0}, {"key": "39815663", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891294948982, "ground_truth": 0}, {"key": "39815663", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995903065461, "ground_truth": 0}, {"key": "35121432", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9289263302821014, "ground_truth": 0}, {"key": "35121432", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8969755774999828, "ground_truth": 0}, {"key": "35121432", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9348724462965049, "ground_truth": 0}, {"key": "35121432", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9161096095640315, "ground_truth": 0}, {"key": "35121432", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8723473692702702, "ground_truth": 0}, {"key": "21712310", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6706083036717848, "ground_truth": 0}, {"key": "21712310", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6297746141743624, "ground_truth": 0}, {"key": "21712310", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6825737227113193, "ground_truth": 0}, {"key": "21712310", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253748821681, "ground_truth": 0}, {"key": "21712310", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105753397014, "ground_truth": 0}, {"key": "37952914", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8187368045728575, "ground_truth": 0}, {"key": "37952914", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7476159567265981, "ground_truth": 0}, {"key": "37952914", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8643104646150884, "ground_truth": 0}, {"key": "37952914", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677583811233, "ground_truth": 0}, {"key": "37952914", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.845942448210421, "ground_truth": 0}, {"key": "38956779", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5907791915878894, "ground_truth": 0}, {"key": "38956779", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6992544227937775, "ground_truth": 0}, {"key": "38956779", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6315942914411313, "ground_truth": 0}, {"key": "38956779", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646037262733, "ground_truth": 0}, {"key": "38956779", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6315942781513547, "ground_truth": 0}, {"key": "36101833", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673070730752, "ground_truth": 0}, {"key": "36101833", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.839733974980624, "ground_truth": 0}, {"key": "36101833", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8278281312178425, "ground_truth": 0}, {"key": "36101833", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624869392027, "ground_truth": 0}, {"key": "36101833", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437730784055, "ground_truth": 0}, {"key": "35544662", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6976089070157386, "ground_truth": 0}, {"key": "35544662", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7745833937275572, "ground_truth": 0}, {"key": "35544662", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5736784310197118, "ground_truth": 0}, {"key": "35544662", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240844493412, "ground_truth": 0}, {"key": "35544662", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321903012576, "ground_truth": 0}, {"key": "39759044", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8606036156116192, "ground_truth": 0}, {"key": "39759044", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8092759720734728, "ground_truth": 0}, {"key": "39759044", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8568122961166401, "ground_truth": 0}, {"key": "39759044", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382034458801, "ground_truth": 0}, {"key": "39759044", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892337079486083, "ground_truth": 0}, {"key": "39433018", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9111796993261725, "ground_truth": 0}, {"key": "39433018", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9246876920463503, "ground_truth": 0}, {"key": "39433018", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9059898198369742, "ground_truth": 0}, {"key": "39433018", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9059898244166005, "ground_truth": 0}, {"key": "39433018", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.905989819416909, "ground_truth": 0}, {"key": "22111959", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8140527928216328, "ground_truth": 0}, {"key": "22111959", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7025300379099759, "ground_truth": 0}, {"key": "22111959", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7981867922890189, "ground_truth": 0}, {"key": "22111959", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936545421091, "ground_truth": 0}, {"key": "22111959", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506531566744, "ground_truth": 0}, {"key": "38210094", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7534666686818384, "ground_truth": 0}, {"key": "38210094", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5350984578996973, "ground_truth": 0}, {"key": "38210094", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5698526484735472, "ground_truth": 0}, {"key": "38210094", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723317168374994, "ground_truth": 0}, {"key": "38210094", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.49609381889207355, "ground_truth": 0}, {"key": "37675935", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8469578317423389, "ground_truth": 0}, {"key": "37675935", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.869714580740108, "ground_truth": 0}, {"key": "37675935", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8104789178401254, "ground_truth": 0}, {"key": "37675935", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358506844433, "ground_truth": 0}, {"key": "37675935", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897132971524, "ground_truth": 0}, {"key": "35732604", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6688802585036108, "ground_truth": 0}, {"key": "35732604", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5869964420722548, "ground_truth": 0}, {"key": "35732604", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6020615764479105, "ground_truth": 0}, {"key": "35732604", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666431563642, "ground_truth": 0}, {"key": "35732604", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300694877139, "ground_truth": 0}, {"key": "27453212", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.84695784319735, "ground_truth": 0}, {"key": "27453212", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8152324907392702, "ground_truth": 0}, {"key": "27453212", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7879312078992043, "ground_truth": 0}, {"key": "27453212", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624944805531, "ground_truth": 0}, {"key": "27453212", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117847103163, "ground_truth": 0}, {"key": "39910047", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6636689193877665, "ground_truth": 0}, {"key": "39910047", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.779992910842676, "ground_truth": 0}, {"key": "39910047", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.75922541568569, "ground_truth": 0}, {"key": "39910047", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307862436975, "ground_truth": 0}, {"key": "39910047", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228473306342, "ground_truth": 0}, {"key": "40054265", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6242935435305816, "ground_truth": 0}, {"key": "40054265", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5525397106316745, "ground_truth": 0}, {"key": "40054265", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7549149864677622, "ground_truth": 0}, {"key": "40054265", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982200255387, "ground_truth": 0}, {"key": "40054265", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.629774595501357, "ground_truth": 0}, {"key": "19984615", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7577943659607167, "ground_truth": 0}, {"key": "19984615", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6959583170930019, "ground_truth": 0}, {"key": "19984615", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8278281454693096, "ground_truth": 0}, {"key": "19984615", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.624293536323837, "ground_truth": 0}, {"key": "19984615", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.734119511398904, "ground_truth": 0}, {"key": "16490806", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.49609383063552526, "ground_truth": 0}, {"key": "16490806", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6297746241919855, "ground_truth": 0}, {"key": "16490806", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6723317180066751, "ground_truth": 0}, {"key": "16490806", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118465798866, "ground_truth": 0}, {"key": "16490806", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585789887372, "ground_truth": 0}, {"key": "36396237", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.950410972156184, "ground_truth": 0}, {"key": "36396237", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9385759507129818, "ground_truth": 0}, {"key": "36396237", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9702399059040645, "ground_truth": 0}, {"key": "36396237", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9202179886005332, "ground_truth": 0}, {"key": "36396237", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418104143895, "ground_truth": 0}, {"key": "40726444", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8864204086498372, "ground_truth": 0}, {"key": "40726444", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8489722108348293, "ground_truth": 0}, {"key": "40726444", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8418256613259558, "ground_truth": 0}, {"key": "40726444", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919919057855, "ground_truth": 0}, {"key": "40726444", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382058423906, "ground_truth": 0}, {"key": "37314826", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7386690825007729, "ground_truth": 0}, {"key": "37314826", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6774740106014067, "ground_truth": 0}, {"key": "37314826", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7325918488209434, "ground_truth": 0}, {"key": "37314826", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802632206818, "ground_truth": 0}, {"key": "37314826", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159618179896, "ground_truth": 0}, {"key": "38506971", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6688802591259582, "ground_truth": 0}, {"key": "38506971", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6774740276519678, "ground_truth": 0}, {"key": "38506971", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7520125757392396, "ground_truth": 0}, {"key": "38506971", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679365963947826, "ground_truth": 0}, {"key": "38506971", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.45326184455282664, "ground_truth": 0}, {"key": "40699312", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8267118089885102, "ground_truth": 0}, {"key": "40699312", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8031738176939414, "ground_truth": 0}, {"key": "40699312", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8791467507646824, "ground_truth": 0}, {"key": "40699312", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970845814077, "ground_truth": 0}, {"key": "40699312", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059285521115, "ground_truth": 0}, {"key": "34695474", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228407969897, "ground_truth": 0}, {"key": "34695474", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7122321959091308, "ground_truth": 0}, {"key": "34695474", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6842640247083699, "ground_truth": 0}, {"key": "34695474", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105422608514, "ground_truth": 0}, {"key": "34695474", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837770447789, "ground_truth": 0}, {"key": "36281498", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8568122913552761, "ground_truth": 0}, {"key": "36281498", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8688267745462327, "ground_truth": 0}, {"key": "36281498", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8976952822809506, "ground_truth": 0}, {"key": "36281498", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549497863268, "ground_truth": 0}, {"key": "36281498", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972787374966, "ground_truth": 0}, {"key": "39558652", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6976089204705529, "ground_truth": 0}, {"key": "39558652", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6279512163951859, "ground_truth": 0}, {"key": "39558652", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.779992904829725, "ground_truth": 0}, {"key": "39558652", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916116902933, "ground_truth": 0}, {"key": "39558652", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.613236555527736, "ground_truth": 0}, {"key": "37330579", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6150878714040645, "ground_truth": 0}, {"key": "37330579", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7416740249812923, "ground_truth": 0}, {"key": "37330579", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5058591074072182, "ground_truth": 0}, {"key": "37330579", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061602297132, "ground_truth": 0}, {"key": "37330579", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527622440004, "ground_truth": 0}, {"key": "40547658", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8080672012497176, "ground_truth": 0}, {"key": "40547658", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526168005664, "ground_truth": 0}, {"key": "40547658", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8300437771045683, "ground_truth": 0}, {"key": "40547658", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366418815209, "ground_truth": 0}, {"key": "40547658", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891221315283, "ground_truth": 0}, {"key": "37119340", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7892336886555038, "ground_truth": 0}, {"key": "37119340", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7563575577671395, "ground_truth": 0}, {"key": "37119340", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7461390123473955, "ground_truth": 0}, {"key": "37119340", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689554399569, "ground_truth": 0}, {"key": "37119340", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.740174377156133, "ground_truth": 0}, {"key": "35301627", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6370307856327461, "ground_truth": 0}, {"key": "35301627", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5926665692559218, "ground_truth": 0}, {"key": "35301627", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7648916032498305, "ground_truth": 0}, {"key": "35301627", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.712232219201385, "ground_truth": 0}, {"key": "35301627", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416591576975, "ground_truth": 0}, {"key": "34037168", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7704647947824302, "ground_truth": 0}, {"key": "34037168", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8116760209680831, "ground_truth": 0}, {"key": "34037168", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6959583182891353, "ground_truth": 0}, {"key": "34037168", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.680878592013409, "ground_truth": 0}, {"key": "34037168", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715197115346, "ground_truth": 0}, {"key": "39703862", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.954984469119957, "ground_truth": 0}, {"key": "39703862", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9118099579992196, "ground_truth": 0}, {"key": "39703862", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9207896800227735, "ground_truth": 0}, {"key": "39703862", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9496693630877374, "ground_truth": 0}, {"key": "39703862", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.946200357275391, "ground_truth": 0}, {"key": "16554814", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9299510410722059, "ground_truth": 0}, {"key": "16554814", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9674102580264212, "ground_truth": 0}, {"key": "16554814", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9257686301747166, "ground_truth": 0}, {"key": "16554814", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.939024816542599, "ground_truth": 0}, {"key": "16554814", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127490448292, "ground_truth": 0}, {"key": "32983099", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4571367325894655, "ground_truth": 0}, {"key": "32983099", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5888891214000797, "ground_truth": 0}, {"key": "32983099", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.48828340946036575, "ground_truth": 0}, {"key": "32983099", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.49414087747636526, "ground_truth": 0}, {"key": "32983099", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5312093526756082, "ground_truth": 0}, {"key": "41072994", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.540923873589669, "ground_truth": 0}, {"key": "41072994", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7592253853579972, "ground_truth": 0}, {"key": "41072994", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6279512125761588, "ground_truth": 0}, {"key": "41072994", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102586115199, "ground_truth": 0}, {"key": "41072994", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819586980422, "ground_truth": 0}, {"key": "38396247", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8267117906986658, "ground_truth": 0}, {"key": "38396247", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267118023220814, "ground_truth": 0}, {"key": "38396247", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8757870058701227, "ground_truth": 0}, {"key": "38396247", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9092645182554316, "ground_truth": 0}, {"key": "38396247", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9376689659960854, "ground_truth": 0}, {"key": "37507998", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8365545502323609, "ground_truth": 0}, {"key": "37507998", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8300437857751423, "ground_truth": 0}, {"key": "37507998", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8568123150265379, "ground_truth": 0}, {"key": "37507998", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267118041837705, "ground_truth": 0}, {"key": "37507998", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.860603627423679, "ground_truth": 0}, {"key": "32593929", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6706082715574356, "ground_truth": 0}, {"key": "32593929", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7310585825002426, "ground_truth": 0}, {"key": "32593929", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6584175084300574, "ground_truth": 0}, {"key": "32593929", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.690976299921007, "ground_truth": 0}, {"key": "32593929", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008948101507638, "ground_truth": 0}, {"key": "36056449", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4282334074848347, "ground_truth": 0}, {"key": "36056449", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.42250464532616433, "ground_truth": 0}, {"key": "36056449", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5467381620765375, "ground_truth": 0}, {"key": "36056449", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926665963627866, "ground_truth": 0}, {"key": "36056449", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891360344306, "ground_truth": 0}, {"key": "21986185", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.33111973630665986, "ground_truth": 0}, {"key": "21986185", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.24220563704270806, "ground_truth": 0}, {"key": "21986185", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.43014735086779393, "ground_truth": 0}, {"key": "21986185", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.486331523616376, "ground_truth": 0}, {"key": "21986185", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.4016878027463556, "ground_truth": 0}, {"key": "40757465", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7090191301764847, "ground_truth": 0}, {"key": "40757465", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5679366354502888, "ground_truth": 0}, {"key": "40757465", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7025300509437604, "ground_truth": 0}, {"key": "40757465", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819538631955, "ground_truth": 0}, {"key": "40757465", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191363740516, "ground_truth": 0}, {"key": "35198313", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6261241872054255, "ground_truth": 0}, {"key": "35198313", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7866228186249407, "ground_truth": 0}, {"key": "35198313", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6513548711846968, "ground_truth": 0}, {"key": "35198313", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640429912709, "ground_truth": 0}, {"key": "35198313", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159631231842, "ground_truth": 0}, {"key": "30604618", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6791787345951334, "ground_truth": 0}, {"key": "30604618", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7772998526301954, "ground_truth": 0}, {"key": "30604618", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7217432192774619, "ground_truth": 0}, {"key": "30604618", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723317050041763, "ground_truth": 0}, {"key": "30604618", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317132475115, "ground_truth": 0}, {"key": "35779006", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6757645808753312, "ground_truth": 0}, {"key": "35779006", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7879312097965504, "ground_truth": 0}, {"key": "35779006", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6442251242745224, "ground_truth": 0}, {"key": "35779006", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324531136958, "ground_truth": 0}, {"key": "35779006", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943707358782, "ground_truth": 0}, {"key": "33858956", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7969253649050788, "ground_truth": 0}, {"key": "33858956", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6495786046285345, "ground_truth": 0}, {"key": "33858956", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7994423282826194, "ground_truth": 0}, {"key": "33858956", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897177442179, "ground_truth": 0}, {"key": "33858956", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300604423923, "ground_truth": 0}, {"key": "38633880", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7772998530805081, "ground_truth": 0}, {"key": "38633880", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7943849467777253, "ground_truth": 0}, {"key": "38633880", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7905303050578512, "ground_truth": 0}, {"key": "38633880", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850138952523, "ground_truth": 0}, {"key": "38633880", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.658417460538173, "ground_truth": 0}, {"key": "36654905", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9750122060780481, "ground_truth": 0}, {"key": "36654905", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9890130576917417, "ground_truth": 0}, {"key": "36654905", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9556514182204281, "ground_truth": 0}, {"key": "36654905", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9477691381987351, "ground_truth": 0}, {"key": "36654905", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9518632311760358, "ground_truth": 0}, {"key": "26547482", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5292633914768093, "ground_truth": 0}, {"key": "26547482", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5136684727751324, "ground_truth": 0}, {"key": "26547482", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5813031030872373, "ground_truth": 0}, {"key": "26547482", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.63883529322578, "ground_truth": 0}, {"key": "26547482", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.554470450726163, "ground_truth": 0}, {"key": "36439068", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7839884680768321, "ground_truth": 0}, {"key": "36439068", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8438951079354031, "ground_truth": 0}, {"key": "36439068", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7170118762805587, "ground_truth": 0}, {"key": "36439068", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666541262355, "ground_truth": 0}, {"key": "36439068", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216293333108, "ground_truth": 0}, {"key": "30501258", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.954984467195271, "ground_truth": 0}, {"key": "30501258", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9412234445391893, "ground_truth": 0}, {"key": "30501258", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9268352853385703, "ground_truth": 0}, {"key": "30501258", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9190632883877636, "ground_truth": 0}, {"key": "30501258", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277828594262, "ground_truth": 0}, {"key": "37560941", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8548846371067401, "ground_truth": 0}, {"key": "37560941", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8697145914148627, "ground_truth": 0}, {"key": "37560941", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7826624921124787, "ground_truth": 0}, {"key": "37560941", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094005678088, "ground_truth": 0}, {"key": "37560941", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631412504112, "ground_truth": 0}, {"key": "36801665", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8840392829666986, "ground_truth": 0}, {"key": "36801665", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9046505336604561, "ground_truth": 0}, {"key": "36801665", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8910549556530538, "ground_truth": 0}, {"key": "36801665", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206750118249, "ground_truth": 0}, {"key": "36801665", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213663645585, "ground_truth": 0}, {"key": "34954610", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6706082801920539, "ground_truth": 0}, {"key": "34954610", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6315943051915747, "ground_truth": 0}, {"key": "34954610", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6297745991044534, "ground_truth": 0}, {"key": "34954610", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.58320337726356, "ground_truth": 0}, {"key": "34954610", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.737158156946355, "ground_truth": 0}, {"key": "37020510", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7905303129175809, "ground_truth": 0}, {"key": "37020510", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526179546743, "ground_truth": 0}, {"key": "37020510", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6876299873007042, "ground_truth": 0}, {"key": "37020510", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324838225459, "ground_truth": 0}, {"key": "37020510", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.786622826578711, "ground_truth": 0}, {"key": "38064637", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6477982275997467, "ground_truth": 0}, {"key": "38064637", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5175708859605799, "ground_truth": 0}, {"key": "38064637", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.48633152212861414, "ground_truth": 0}, {"key": "38064637", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056047697032, "ground_truth": 0}, {"key": "38064637", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.47268348390488946, "ground_truth": 0}, {"key": "40886108", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9437636559986619, "ground_truth": 0}, {"key": "40886108", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8529354801808982, "ground_truth": 0}, {"key": "40886108", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148166858997, "ground_truth": 0}, {"key": "40886108", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9086178953107745, "ground_truth": 0}, {"key": "40886108", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372107966627575, "ground_truth": 0}, {"key": "38554603", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8068526252381385, "ground_truth": 0}, {"key": "38554603", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8499711817681004, "ground_truth": 0}, {"key": "38554603", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7106283154027291, "ground_truth": 0}, {"key": "38554603", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366282083429, "ground_truth": 0}, {"key": "38554603", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825803235497, "ground_truth": 0}, {"key": "39115586", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6442251045204648, "ground_truth": 0}, {"key": "39115586", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7356416633201198, "ground_truth": 0}, {"key": "39115586", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6992544282425226, "ground_truth": 0}, {"key": "39115586", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680085055075, "ground_truth": 0}, {"key": "39115586", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159412565779, "ground_truth": 0}, {"key": "38786314", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8624675407367977, "ground_truth": 0}, {"key": "38786314", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8278281636751325, "ground_truth": 0}, {"key": "38786314", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8587185822906647, "ground_truth": 0}, {"key": "38786314", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759829018622, "ground_truth": 0}, {"key": "38786314", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789213317992, "ground_truth": 0}, {"key": "38721078", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9433475674584572, "ground_truth": 0}, {"key": "38721078", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9367494753348165, "ground_truth": 0}, {"key": "38721078", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.906653116288611, "ground_truth": 0}, {"key": "38721078", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.948154532559575, "ground_truth": 0}, {"key": "38721078", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9469902276946256, "ground_truth": 0}, {"key": "39475467", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6242935269672002, "ground_truth": 0}, {"key": "39475467", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6388352784387947, "ground_truth": 0}, {"key": "39475467", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8397339768547399, "ground_truth": 0}, {"key": "39475467", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646011639017, "ground_truth": 0}, {"key": "39475467", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936498904223, "ground_truth": 0}, {"key": "35691234", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.67405047206167, "ground_truth": 0}, {"key": "35691234", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7549149818457237, "ground_truth": 0}, {"key": "35691234", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6261242007436078, "ground_truth": 0}, {"key": "35691234", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476652558009, "ground_truth": 0}, {"key": "35691234", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321781458837, "ground_truth": 0}, {"key": "36871390", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7577943662675347, "ground_truth": 0}, {"key": "36871390", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8164063678676303, "ground_truth": 0}, {"key": "36871390", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7772998506438522, "ground_truth": 0}, {"key": "36871390", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884635543328, "ground_truth": 0}, {"key": "36871390", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883731258852, "ground_truth": 0}, {"key": "31730844", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7786493132931502, "ground_truth": 0}, {"key": "31730844", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6352224281863409, "ground_truth": 0}, {"key": "31730844", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8991213839560996, "ground_truth": 0}, {"key": "31730844", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549520734379, "ground_truth": 0}, {"key": "31730844", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545662106744, "ground_truth": 0}, {"key": "30810940", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7217432109697522, "ground_truth": 0}, {"key": "30810940", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6548947349241199, "ground_truth": 0}, {"key": "30810940", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7563575716741964, "ground_truth": 0}, {"key": "30810940", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740136431448, "ground_truth": 0}, {"key": "30810940", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891383452379, "ground_truth": 0}, {"key": "39352003", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8791467569132969, "ground_truth": 0}, {"key": "39352003", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.894789459694651, "ground_truth": 0}, {"key": "39352003", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8976952882157085, "ground_truth": 0}, {"key": "39352003", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9073122164471443, "ground_truth": 0}, {"key": "39352003", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772397269327, "ground_truth": 0}, {"key": "40118123", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.573678424740477, "ground_truth": 0}, {"key": "40118123", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.783988459057698, "ground_truth": 0}, {"key": "40118123", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6876300061085404, "ground_truth": 0}, {"key": "40118123", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544332356689, "ground_truth": 0}, {"key": "40118123", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601462315917, "ground_truth": 0}, {"key": "37114191", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5640984675501118, "ground_truth": 0}, {"key": "37114191", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5078118279047015, "ground_truth": 0}, {"key": "37114191", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6150878702435604, "ground_truth": 0}, {"key": "37114191", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.586996433698291, "ground_truth": 0}, {"key": "37114191", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754066091609934, "ground_truth": 0}, {"key": "39268203", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8489721878536532, "ground_truth": 0}, {"key": "39268203", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8757870101061429, "ground_truth": 0}, {"key": "39268203", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.78133062254049, "ground_truth": 0}, {"key": "39268203", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.809275989352948, "ground_truth": 0}, {"key": "39268203", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199620080275, "ground_truth": 0}, {"key": "37950968", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7648916284328127, "ground_truth": 0}, {"key": "37950968", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6791786946803432, "ground_truth": 0}, {"key": "37950968", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7981867775213769, "ground_truth": 0}, {"key": "37950968", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434916881974, "ground_truth": 0}, {"key": "37950968", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786129290707, "ground_truth": 0}, {"key": "34959807", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7969253700161949, "ground_truth": 0}, {"key": "34959807", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7732163676295051, "ground_truth": 0}, {"key": "34959807", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8479677467957957, "ground_truth": 0}, {"key": "34959807", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898226542337, "ground_truth": 0}, {"key": "34959807", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.756357556734713, "ground_truth": 0}, {"key": "35631314", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8679338331280273, "ground_truth": 0}, {"key": "35631314", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8624675389638154, "ground_truth": 0}, {"key": "35631314", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9046505329729716, "ground_truth": 0}, {"key": "35631314", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9073122187492031, "ground_truth": 0}, {"key": "35631314", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117949406455, "ground_truth": 0}, {"key": "38082365", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8255897223099216, "ground_truth": 0}, {"key": "38082365", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7325918350861881, "ground_truth": 0}, {"key": "38082365", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7476159478779351, "ground_truth": 0}, {"key": "38082365", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152325015889426, "ground_truth": 0}, {"key": "38082365", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.816406375479948, "ground_truth": 0}, {"key": "37242829", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8479677641890776, "ground_truth": 0}, {"key": "37242829", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431680130265662, "ground_truth": 0}, {"key": "37242829", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6477982188810147, "ground_truth": 0}, {"key": "37242829", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089062422903, "ground_truth": 0}, {"key": "37242829", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431679926005536, "ground_truth": 0}, {"key": "38556068", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7201715219438554, "ground_truth": 0}, {"key": "38556068", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8006920209305177, "ground_truth": 0}, {"key": "38556068", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.660172382875788, "ground_truth": 0}, {"key": "38556068", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935148583957, "ground_truth": 0}, {"key": "38556068", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476687102049, "ground_truth": 0}, {"key": "32969336", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6976089069565244, "ground_truth": 0}, {"key": "32969336", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8887588015147717, "ground_truth": 0}, {"key": "32969336", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8354835399207573, "ground_truth": 0}, {"key": "32969336", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879311856048061, "ground_truth": 0}, {"key": "32969336", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228483081311, "ground_truth": 0}, {"key": "36825153", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7732163648843572, "ground_truth": 0}, {"key": "36825153", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.734119523885035, "ground_truth": 0}, {"key": "36825153", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8006919968883514, "ground_truth": 0}, {"key": "36825153", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.47463118842817464, "ground_truth": 0}, {"key": "36825153", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389893289552, "ground_truth": 0}, {"key": "41050146", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8910549640509097, "ground_truth": 0}, {"key": "41050146", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8962513719676303, "ground_truth": 0}, {"key": "41050146", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8606036225304414, "ground_truth": 0}, {"key": "41050146", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104553961473, "ground_truth": 0}, {"key": "41050146", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9149009630255808, "ground_truth": 0}, {"key": "27865037", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7041601465146238, "ground_truth": 0}, {"key": "27865037", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5794004398447506, "ground_truth": 0}, {"key": "27865037", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6279512205100876, "ground_truth": 0}, {"key": "27865037", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.620621615563893, "ground_truth": 0}, {"key": "27865037", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786939927188, "ground_truth": 0}, {"key": "39868565", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8832359930502879, "ground_truth": 0}, {"key": "39868565", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8902942258543218, "ground_truth": 0}, {"key": "39868565", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7969253763083309, "ground_truth": 0}, {"key": "39868565", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377661925751, "ground_truth": 0}, {"key": "39868565", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311827994606, "ground_truth": 0}, {"key": "37761968", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7310585990259476, "ground_truth": 0}, {"key": "37761968", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7534666583147616, "ground_truth": 0}, {"key": "37761968", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7634837546500153, "ground_truth": 0}, {"key": "37761968", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044058913353872, "ground_truth": 0}, {"key": "37761968", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056322029519015, "ground_truth": 0}, {"key": "16326139", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.61323655009551, "ground_truth": 0}, {"key": "16326139", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7264256062836975, "ground_truth": 0}, {"key": "16326139", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7431680065165582, "ground_truth": 0}, {"key": "16326139", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.760650664950346, "ground_truth": 0}, {"key": "16326139", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.564098488259817, "ground_truth": 0}, {"key": "36568381", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9173026572425449, "ground_truth": 0}, {"key": "36568381", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545649352522, "ground_truth": 0}, {"key": "36568381", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9099070030878577, "ground_truth": 0}, {"key": "36568381", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9213576145673744, "ground_truth": 0}, {"key": "36568381", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274117367111, "ground_truth": 0}, {"key": "39855613", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8198933367193119, "ground_truth": 0}, {"key": "39855613", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.790530331468899, "ground_truth": 0}, {"key": "39855613", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8140528019692738, "ground_truth": 0}, {"key": "39855613", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366429900123, "ground_truth": 0}, {"key": "39855613", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933423883882, "ground_truth": 0}, {"key": "29856302", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6224593309312885, "ground_truth": 0}, {"key": "29856302", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6113819495829363, "ground_truth": 0}, {"key": "29856302", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6242935420625345, "ground_truth": 0}, {"key": "29856302", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849531596207, "ground_truth": 0}, {"key": "29856302", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.620621611610296, "ground_truth": 0}, {"key": "35641106", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7786493072251384, "ground_truth": 0}, {"key": "35641106", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.839733978198364, "ground_truth": 0}, {"key": "35641106", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7416740186614308, "ground_truth": 0}, {"key": "35641106", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583303093654, "ground_truth": 0}, {"key": "35641106", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592253947306427, "ground_truth": 0}, {"key": "39474558", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7233094820009285, "ground_truth": 0}, {"key": "39474558", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.713830717617052, "ground_truth": 0}, {"key": "39474558", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.672331693286225, "ground_truth": 0}, {"key": "39474558", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.828938801916224, "ground_truth": 0}, {"key": "39474558", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059172382569, "ground_truth": 0}, {"key": "34338135", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8887588014928642, "ground_truth": 0}, {"key": "34338135", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.847967764389975, "ground_truth": 0}, {"key": "34338135", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9329437106418232, "ground_truth": 0}, {"key": "34338135", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9026096025741422, "ground_truth": 0}, {"key": "34338135", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9039745084391454, "ground_truth": 0}, {"key": "35870330", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7943849541377324, "ground_truth": 0}, {"key": "35870330", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8643104501362076, "ground_truth": 0}, {"key": "35870330", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9079671432956051, "ground_truth": 0}, {"key": "35870330", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145944077188, "ground_truth": 0}, {"key": "35870330", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677544002767, "ground_truth": 0}, {"key": "24478245", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7813306361881354, "ground_truth": 0}, {"key": "24478245", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8615382135484808, "ground_truth": 0}, {"key": "24478245", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7956580976607585, "ground_truth": 0}, {"key": "24478245", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359961850311, "ground_truth": 0}, {"key": "24478245", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430373203513, "ground_truth": 0}, {"key": "38485946", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8104789078309457, "ground_truth": 0}, {"key": "38485946", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7025300518892793, "ground_truth": 0}, {"key": "38485946", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6057990468122194, "ground_truth": 0}, {"key": "38485946", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9053223092343778, "ground_truth": 0}, {"key": "38485946", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339674730566, "ground_truth": 0}, {"key": "32509613", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867742470565, "ground_truth": 0}, {"key": "32509613", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8624675109300277, "ground_truth": 0}, {"key": "32509613", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.860603631686309, "ground_truth": 0}, {"key": "32509613", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185894153778, "ground_truth": 0}, {"key": "32509613", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.79438495924106, "ground_truth": 0}, {"key": "34078819", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8140528117884546, "ground_truth": 0}, {"key": "34078819", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8418256444169238, "ground_truth": 0}, {"key": "34078819", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9005297868368405, "ground_truth": 0}, {"key": "34078819", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199689286942, "ground_truth": 0}, {"key": "34078819", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215377616002, "ground_truth": 0}, {"key": "39523865", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8998277744864579, "ground_truth": 0}, {"key": "39523865", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8397339630329875, "ground_truth": 0}, {"key": "39523865", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9046505413014737, "ground_truth": 0}, {"key": "39523865", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438950872739036, "ground_truth": 0}, {"key": "39523865", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437636549604, "ground_truth": 0}, {"key": "33146158", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8152324911099105, "ground_truth": 0}, {"key": "33146158", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8587185812308737, "ground_truth": 0}, {"key": "33146158", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8624675329706413, "ground_truth": 0}, {"key": "33146158", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423361356298, "ground_truth": 0}, {"key": "33146158", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367777384934, "ground_truth": 0}, {"key": "32083974", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7879311922644513, "ground_truth": 0}, {"key": "32083974", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8187367959036531, "ground_truth": 0}, {"key": "32083974", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9403530558355644, "ground_truth": 0}, {"key": "32083974", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9196425346056676, "ground_truth": 0}, {"key": "32083974", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9207896764448625, "ground_truth": 0}, {"key": "34378482", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8933094065633984, "ground_truth": 0}, {"key": "34378482", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8984105502566311, "ground_truth": 0}, {"key": "34378482", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9339146271840392, "ground_truth": 0}, {"key": "34378482", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9167080779913688, "ground_truth": 0}, {"key": "34378482", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8969755716550465, "ground_truth": 0}, {"key": "38080102", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6495786104392746, "ground_truth": 0}, {"key": "38080102", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6636689304524631, "ground_truth": 0}, {"key": "38080102", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.690976285463758, "ground_truth": 0}, {"key": "38080102", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201715163327503, "ground_truth": 0}, {"key": "38080102", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324587993956, "ground_truth": 0}, {"key": "40244537", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6636689363379624, "ground_truth": 0}, {"key": "40244537", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6566582701201381, "ground_truth": 0}, {"key": "40244537", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5851011530736232, "ground_truth": 0}, {"key": "40244537", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185443343556, "ground_truth": 0}, {"key": "40244537", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878391882725, "ground_truth": 0}, {"key": "33497789", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9124361611974287, "ground_truth": 0}, {"key": "33497789", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.944994712156935, "ground_truth": 0}, {"key": "33497789", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.887204591905623, "ground_truth": 0}, {"key": "33497789", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067203797235, "ground_truth": 0}, {"key": "33497789", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677443685361, "ground_truth": 0}, {"key": "28816889", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9632305338794245, "ground_truth": 0}, {"key": "28816889", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9196425343253329, "ground_truth": 0}, {"key": "28816889", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.931462505577673, "ground_truth": 0}, {"key": "28816889", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9196425334694814, "ground_truth": 0}, {"key": "28816889", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9213576218821453, "ground_truth": 0}, {"key": "38157127", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7041601500192526, "ground_truth": 0}, {"key": "38157127", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7356416426262841, "ground_truth": 0}, {"key": "38157127", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7431679982840903, "ground_truth": 0}, {"key": "38157127", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.694302660464414, "ground_truth": 0}, {"key": "38157127", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629586152434209, "ground_truth": 0}, {"key": "36183569", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5717666042344027, "ground_truth": 0}, {"key": "36183569", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7416740212869514, "ground_truth": 0}, {"key": "36183569", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7154239998636815, "ground_truth": 0}, {"key": "36183569", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615714424131, "ground_truth": 0}, {"key": "36183569", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195281335489, "ground_truth": 0}, {"key": "36012016", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8233283949131766, "ground_truth": 0}, {"key": "36012016", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545491648975, "ground_truth": 0}, {"key": "36012016", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8697145901525587, "ground_truth": 0}, {"key": "36012016", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545572565047, "ground_truth": 0}, {"key": "36012016", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.901920672010282, "ground_truth": 0}, {"key": "34571973", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8006920016375142, "ground_truth": 0}, {"key": "34571973", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8397339799137571, "ground_truth": 0}, {"key": "34571973", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.884039282395878, "ground_truth": 0}, {"key": "34571973", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.835483535205975, "ground_truth": 0}, {"key": "34571973", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760339992546, "ground_truth": 0}, {"key": "38707498", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8386797620848091, "ground_truth": 0}, {"key": "38707498", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9130583420971142, "ground_truth": 0}, {"key": "38707498", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8774768013150002, "ground_truth": 0}, {"key": "38707498", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513737962092, "ground_truth": 0}, {"key": "38707498", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970795403798, "ground_truth": 0}, {"key": "35459082", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9462003577521887, "ground_truth": 0}, {"key": "35459082", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9783846681611575, "ground_truth": 0}, {"key": "35459082", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9252299573477831, "ground_truth": 0}, {"key": "35459082", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.954984468355308, "ground_truth": 0}, {"key": "35459082", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099642544294, "ground_truth": 0}, {"key": "39464041", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.966410492123737, "ground_truth": 0}, {"key": "39464041", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9645892682635975, "ground_truth": 0}, {"key": "39464041", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9770226314066536, "ground_truth": 0}, {"key": "39464041", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9763105297900423, "ground_truth": 0}, {"key": "39464041", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9572778016712168, "ground_truth": 0}, {"key": "23782052", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8633916031487302, "ground_truth": 0}, {"key": "23782052", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8791467729205414, "ground_truth": 0}, {"key": "23782052", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148311358364, "ground_truth": 0}, {"key": "23782052", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545606004821, "ground_truth": 0}, {"key": "23782052", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036105606346, "ground_truth": 0}, {"key": "36568455", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6876299927526338, "ground_truth": 0}, {"key": "36568455", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7772998549594823, "ground_truth": 0}, {"key": "36568455", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8376199838320219, "ground_truth": 0}, {"key": "36568455", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879311882151571, "ground_truth": 0}, {"key": "36568455", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.821044119657813, "ground_truth": 0}, {"key": "38469552", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8976952955357559, "ground_truth": 0}, {"key": "38469552", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8670357563946206, "ground_truth": 0}, {"key": "38469552", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8976952962028865, "ground_truth": 0}, {"key": "38469552", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9053223054023098, "ground_truth": 0}, {"key": "38469552", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942287055677, "ground_truth": 0}, {"key": "35922277", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8991213768626821, "ground_truth": 0}, {"key": "35922277", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9032942183665433, "ground_truth": 0}, {"key": "35922277", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8428631542797543, "ground_truth": 0}, {"key": "35922277", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.861538202040913, "ground_truth": 0}, {"key": "35922277", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9252299599157469, "ground_truth": 0}, {"key": "32744293", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8714748596359506, "ground_truth": 0}, {"key": "32744293", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619264490881, "ground_truth": 0}, {"key": "32744293", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9005297853513813, "ground_truth": 0}, {"key": "32744293", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.839733972872707, "ground_truth": 0}, {"key": "32744293", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711743114782, "ground_truth": 0}, {"key": "30972362", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9304582598216125, "ground_truth": 0}, {"key": "30972362", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9173026624357429, "ground_truth": 0}, {"key": "30972362", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9278877952584118, "ground_truth": 0}, {"key": "30972362", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.956634198155617, "ground_truth": 0}, {"key": "30972362", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9390248225727609, "ground_truth": 0}, {"key": "36380943", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8210441004066587, "ground_truth": 0}, {"key": "36380943", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8749346190187434, "ground_truth": 0}, {"key": "36380943", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8376199736835157, "ground_truth": 0}, {"key": "36380943", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321922985095, "ground_truth": 0}, {"key": "36380943", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423178279776, "ground_truth": 0}, {"key": "36929355", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8244619208794921, "ground_truth": 0}, {"key": "36929355", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526249051207, "ground_truth": 0}, {"key": "36929355", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8397339789358093, "ground_truth": 0}, {"key": "36929355", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256578873637, "ground_truth": 0}, {"key": "36929355", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044058930025204, "ground_truth": 0}, {"key": "39127206", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7416740212947522, "ground_truth": 0}, {"key": "39127206", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5660185200310975, "ground_truth": 0}, {"key": "39127206", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5945512836460085, "ground_truth": 0}, {"key": "39127206", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872104038783, "ground_truth": 0}, {"key": "39127206", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943764452437, "ground_truth": 0}, {"key": "36128318", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7534666456698628, "ground_truth": 0}, {"key": "36128318", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7310585487880344, "ground_truth": 0}, {"key": "36128318", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7233094811230022, "ground_truth": 0}, {"key": "36128318", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059189765521, "ground_truth": 0}, {"key": "36128318", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239957631452, "ground_truth": 0}, {"key": "39863480", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.874934629014539, "ground_truth": 0}, {"key": "39863480", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8848377728600932, "ground_truth": 0}, {"key": "39863480", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8633916153200301, "ground_truth": 0}, {"key": "39863480", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346227425531, "ground_truth": 0}, {"key": "39863480", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344069043611764, "ground_truth": 0}, {"key": "38634057", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9012273989165799, "ground_truth": 0}, {"key": "38634057", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.91054539435012, "ground_truth": 0}, {"key": "38634057", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8887587897177051, "ground_truth": 0}, {"key": "38634057", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359870734158, "ground_truth": 0}, {"key": "38634057", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117899393571, "ground_truth": 0}, {"key": "33131935", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8749346163093359, "ground_truth": 0}, {"key": "33131935", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9299510459703055, "ground_truth": 0}, {"key": "33131935", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8976953038440729, "ground_truth": 0}, {"key": "33131935", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267794683739, "ground_truth": 0}, {"key": "33131935", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278710090029, "ground_truth": 0}, {"key": "39021319", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.821044092277392, "ground_truth": 0}, {"key": "39021319", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7138307444773391, "ground_truth": 0}, {"key": "39021319", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7943849605462595, "ground_truth": 0}, {"key": "39021319", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163622987073, "ground_truth": 0}, {"key": "39021319", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897190154745, "ground_truth": 0}, {"key": "40644571", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6825737526977201, "ground_truth": 0}, {"key": "40644571", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6477982197695616, "ground_truth": 0}, {"key": "40644571", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7431680044308399, "ground_truth": 0}, {"key": "40644571", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689635887583, "ground_truth": 0}, {"key": "40644571", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849530953556, "ground_truth": 0}, {"key": "14681877", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9105453902627795, "ground_truth": 0}, {"key": "14681877", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.941223443413541, "ground_truth": 0}, {"key": "14681877", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.889528841893249, "ground_truth": 0}, {"key": "14681877", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9284087980877943, "ground_truth": 0}, {"key": "14681877", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8955226722461431, "ground_truth": 0}, {"key": "36570890", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6297746326756336, "ground_truth": 0}, {"key": "36570890", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6187804093537791, "ground_truth": 0}, {"key": "36570890", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6261242114971854, "ground_truth": 0}, {"key": "36570890", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926666319817419, "ground_truth": 0}, {"key": "36570890", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631863170625, "ground_truth": 0}, {"key": "30452755", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.894051713417538, "ground_truth": 0}, {"key": "30452755", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9012274147979081, "ground_truth": 0}, {"key": "30452755", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8428631314401739, "ground_truth": 0}, {"key": "30452755", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.800692022407436, "ground_truth": 0}, {"key": "30452755", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637488991573, "ground_truth": 0}, {"key": "37347053", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7041601507067112, "ground_truth": 0}, {"key": "37347053", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7310585898545857, "ground_truth": 0}, {"key": "37347053", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.881614903318881, "ground_truth": 0}, {"key": "37347053", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419766610415, "ground_truth": 0}, {"key": "37347053", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434997615501, "ground_truth": 0}, {"key": "38890979", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.773216345662717, "ground_truth": 0}, {"key": "38890979", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8128673209321272, "ground_truth": 0}, {"key": "38890979", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8210441339324073, "ground_truth": 0}, {"key": "38890979", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445545710371, "ground_truth": 0}, {"key": "38890979", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799929198008683, "ground_truth": 0}, {"key": "32974694", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8509646916504369, "ground_truth": 0}, {"key": "32974694", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9073122282258285, "ground_truth": 0}, {"key": "32974694", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7879312066342079, "ground_truth": 0}, {"key": "32974694", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760122200259, "ground_truth": 0}, {"key": "32974694", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.843895092890578, "ground_truth": 0}, {"key": "38519940", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.862467533349044, "ground_truth": 0}, {"key": "38519940", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9099070013298884, "ground_truth": 0}, {"key": "38519940", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9473810461265775, "ground_truth": 0}, {"key": "38519940", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772332046551, "ground_truth": 0}, {"key": "38519940", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907212978725, "ground_truth": 0}, {"key": "38870104", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8940517175927376, "ground_truth": 0}, {"key": "38870104", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9289263317557954, "ground_truth": 0}, {"key": "38870104", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8991213863331529, "ground_truth": 0}, {"key": "38870104", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9086178943809516, "ground_truth": 0}, {"key": "38870104", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8969755688762052, "ground_truth": 0}, {"key": "34283161", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7676898584609038, "ground_truth": 0}, {"key": "34283161", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8397339845639369, "ground_truth": 0}, {"key": "34283161", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5292633803429645, "ground_truth": 0}, {"key": "34283161", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490871923266281, "ground_truth": 0}, {"key": "34283161", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666513040447, "ground_truth": 0}, {"key": "31650463", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8244619343973576, "ground_truth": 0}, {"key": "31650463", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.836554552272175, "ground_truth": 0}, {"key": "31650463", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8933094118129203, "ground_truth": 0}, {"key": "31650463", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519527917042551, "ground_truth": 0}, {"key": "31650463", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789012068436, "ground_truth": 0}, {"key": "35589432", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8386797651125564, "ground_truth": 0}, {"key": "35589432", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8774767974593422, "ground_truth": 0}, {"key": "35589432", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8509647008858438, "ground_truth": 0}, {"key": "35589432", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204168003353, "ground_truth": 0}, {"key": "35589432", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306319579608, "ground_truth": 0}, {"key": "14412752", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8278281430506712, "ground_truth": 0}, {"key": "14412752", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8278281439255506, "ground_truth": 0}, {"key": "14412752", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8104789182102443, "ground_truth": 0}, {"key": "14412752", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916138219265, "ground_truth": 0}, {"key": "14412752", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432078862653, "ground_truth": 0}, {"key": "37271183", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9658995742890357, "ground_truth": 0}, {"key": "37271183", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9381240107243225, "ground_truth": 0}, {"key": "37271183", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9539660991586435, "ground_truth": 0}, {"key": "37271183", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9496693678357768, "ground_truth": 0}, {"key": "37271183", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9585377291174454, "ground_truth": 0}, {"key": "35588153", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9372107971137925, "ground_truth": 0}, {"key": "35588153", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9118099464882752, "ground_truth": 0}, {"key": "35588153", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9053223024874576, "ground_truth": 0}, {"key": "35588153", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145795489001, "ground_truth": 0}, {"key": "35588153", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105524083655, "ground_truth": 0}, {"key": "39876692", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9053222955129396, "ground_truth": 0}, {"key": "39876692", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8807970831652545, "ground_truth": 0}, {"key": "39876692", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8633916153313307, "ground_truth": 0}, {"key": "39876692", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9190632831528692, "ground_truth": 0}, {"key": "39876692", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517107047024, "ground_truth": 0}, {"key": "38992323", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8872045888948504, "ground_truth": 0}, {"key": "38992323", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8697145941737228, "ground_truth": 0}, {"key": "38992323", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9019206711623029, "ground_truth": 0}, {"key": "38992323", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.769080230276539, "ground_truth": 0}, {"key": "38992323", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681082772924, "ground_truth": 0}, {"key": "37556002", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7931059578317546, "ground_truth": 0}, {"key": "37556002", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.731058585499501, "ground_truth": 0}, {"key": "37556002", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.817574467566069, "ground_truth": 0}, {"key": "37556002", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.836554567818421, "ground_truth": 0}, {"key": "37556002", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.775944569360906, "ground_truth": 0}, {"key": "39875801", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8705972722058994, "ground_truth": 0}, {"key": "39875801", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8998277825137297, "ground_truth": 0}, {"key": "39875801", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9105454115619092, "ground_truth": 0}, {"key": "39875801", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070052731175, "ground_truth": 0}, {"key": "39875801", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343685017892, "ground_truth": 0}, {"key": "39272285", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4320633839487603, "ground_truth": 0}, {"key": "39272285", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.4320633940630463, "ground_truth": 0}, {"key": "39272285", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5486734489370477, "ground_truth": 0}, {"key": "39272285", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.48047871364552514, "ground_truth": 0}, {"key": "39272285", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367271244888, "ground_truth": 0}, {"key": "39629714", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8418256450225662, "ground_truth": 0}, {"key": "39629714", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7416739855926308, "ground_truth": 0}, {"key": "39629714", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7648916272214883, "ground_truth": 0}, {"key": "39629714", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619189988661, "ground_truth": 0}, {"key": "39629714", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802298828898, "ground_truth": 0}, {"key": "34043257", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9026095948598604, "ground_truth": 0}, {"key": "34043257", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.870597266691989, "ground_truth": 0}, {"key": "34043257", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8774767847292102, "ground_truth": 0}, {"key": "34043257", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583486239193, "ground_truth": 0}, {"key": "34043257", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767921880732, "ground_truth": 0}, {"key": "33995240", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6654105492170121, "ground_truth": 0}, {"key": "33995240", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6740504750450285, "ground_truth": 0}, {"key": "33995240", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5926665848973999, "ground_truth": 0}, {"key": "33995240", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381547522001, "ground_truth": 0}, {"key": "33995240", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583270221603731, "ground_truth": 0}, {"key": "39399948", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8568122969318648, "ground_truth": 0}, {"key": "39399948", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7866228328626927, "ground_truth": 0}, {"key": "39399948", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7690802389466173, "ground_truth": 0}, {"key": "39399948", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894629808884, "ground_truth": 0}, {"key": "39399948", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310586135466255, "ground_truth": 0}, {"key": "33185890", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7401743501227518, "ground_truth": 0}, {"key": "33185890", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7606506677740232, "ground_truth": 0}, {"key": "33185890", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7264256098966473, "ground_truth": 0}, {"key": "33185890", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494722008589, "ground_truth": 0}, {"key": "33185890", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802677620569, "ground_truth": 0}, {"key": "35280425", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7718434953949048, "ground_truth": 0}, {"key": "35280425", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8376199557903682, "ground_truth": 0}, {"key": "35280425", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7866228183702426, "ground_truth": 0}, {"key": "35280425", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867927929428, "ground_truth": 0}, {"key": "35280425", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760189987928, "ground_truth": 0}, {"key": "16365170", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8278281523412673, "ground_truth": 0}, {"key": "16365170", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8840392805104349, "ground_truth": 0}, {"key": "16365170", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8902942355802996, "ground_truth": 0}, {"key": "16365170", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884479467881, "ground_truth": 0}, {"key": "16365170", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.846957851444076, "ground_truth": 0}, {"key": "24388238", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4610167730936178, "ground_truth": 0}, {"key": "24388238", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.73105860130676, "ground_truth": 0}, {"key": "24388238", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7446563525364417, "ground_truth": 0}, {"key": "24388238", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105531210546, "ground_truth": 0}, {"key": "24388238", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442251025253128, "ground_truth": 0}, {"key": "35024827", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8489722010918067, "ground_truth": 0}, {"key": "35024827", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8539127631709128, "ground_truth": 0}, {"key": "35024827", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.752012571121915, "ground_truth": 0}, {"key": "35024827", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581808052671, "ground_truth": 0}, {"key": "35024827", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303069679935, "ground_truth": 0}, {"key": "38624944", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228325917916, "ground_truth": 0}, {"key": "38624944", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8019358316452071, "ground_truth": 0}, {"key": "38624944", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7879312046562775, "ground_truth": 0}, {"key": "38624944", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701196408353, "ground_truth": 0}, {"key": "38624944", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867780944042, "ground_truth": 0}, {"key": "34719830", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7310585828386311, "ground_truth": 0}, {"key": "34719830", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9130583436134367, "ground_truth": 0}, {"key": "34719830", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8244619228598798, "ground_truth": 0}, {"key": "34719830", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.878314231933518, "ground_truth": 0}, {"key": "34719830", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677556548759, "ground_truth": 0}, {"key": "38995225", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8333245908954733, "ground_truth": 0}, {"key": "38995225", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9190632818578846, "ground_truth": 0}, {"key": "38995225", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8925625243533797, "ground_truth": 0}, {"key": "38995225", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.894051714848928, "ground_truth": 0}, {"key": "38995225", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9167080760006313, "ground_truth": 0}, {"key": "34242311", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7853085975670022, "ground_truth": 0}, {"key": "34242311", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7732163629880652, "ground_truth": 0}, {"key": "34242311", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7690802605486626, "ground_truth": 0}, {"key": "34242311", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358283924668, "ground_truth": 0}, {"key": "34242311", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117834293022, "ground_truth": 0}, {"key": "39253748", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.961821724382176, "ground_truth": 0}, {"key": "39253748", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9213576233470587, "ground_truth": 0}, {"key": "39253748", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9263037292508155, "ground_truth": 0}, {"key": "39253748", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9477691489674237, "ground_truth": 0}, {"key": "39253748", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942282554533, "ground_truth": 0}, {"key": "37131104", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9943140933726922, "ground_truth": 0}, {"key": "37131104", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9964619137060449, "ground_truth": 0}, {"key": "37131104", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9967775163249512, "ground_truth": 0}, {"key": "37131104", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9918752911402199, "ground_truth": 0}, {"key": "37131104", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9911526453263285, "ground_truth": 0}, {"key": "38490554", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8489722014994271, "ground_truth": 0}, {"key": "38490554", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8056321978221347, "ground_truth": 0}, {"key": "38490554", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8969755728394712, "ground_truth": 0}, {"key": "38490554", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9046505447467457, "ground_truth": 0}, {"key": "38490554", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278742162603, "ground_truth": 0}, {"key": "29009500", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6584174779968484, "ground_truth": 0}, {"key": "29009500", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6774740227448816, "ground_truth": 0}, {"key": "29009500", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.642432482794039, "ground_truth": 0}, {"key": "29009500", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303223684382, "ground_truth": 0}, {"key": "29009500", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063688514338, "ground_truth": 0}, {"key": "36703057", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.895522677646917, "ground_truth": 0}, {"key": "36703057", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8587185783096961, "ground_truth": 0}, {"key": "36703057", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8679338401085389, "ground_truth": 0}, {"key": "36703057", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799929019986596, "ground_truth": 0}, {"key": "36703057", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228180302833, "ground_truth": 0}, {"key": "34876987", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.944994710898866, "ground_truth": 0}, {"key": "34876987", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9343951574493358, "ground_truth": 0}, {"key": "34876987", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.959459261819768, "ground_truth": 0}, {"key": "34876987", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933751025483, "ground_truth": 0}, {"key": "34876987", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.966155967241956, "ground_truth": 0}, {"key": "36209258", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8705972677987043, "ground_truth": 0}, {"key": "36209258", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8344068799950013, "ground_truth": 0}, {"key": "36209258", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7310585813210535, "ground_truth": 0}, {"key": "36209258", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217431901809662, "ground_truth": 0}, {"key": "36209258", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578517525602, "ground_truth": 0}, {"key": "36854437", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7759445517834026, "ground_truth": 0}, {"key": "36854437", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5544704732497759, "ground_truth": 0}, {"key": "36854437", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5736784114584615, "ground_truth": 0}, {"key": "36854437", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.503906163341031, "ground_truth": 0}, {"key": "36854437", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185259856592, "ground_truth": 0}, {"key": "38047723", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7057850070076416, "ground_truth": 0}, {"key": "38047723", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7476159657704801, "ground_truth": 0}, {"key": "38047723", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6584175249924848, "ground_truth": 0}, {"key": "38047723", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149979503837, "ground_truth": 0}, {"key": "38047723", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445585612009, "ground_truth": 0}, {"key": "34287816", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7662936452187089, "ground_truth": 0}, {"key": "34287816", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7185944060481071, "ground_truth": 0}, {"key": "34287816", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.800692004695036, "ground_truth": 0}, {"key": "34287816", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850400969595, "ground_truth": 0}, {"key": "34287816", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702903903295, "ground_truth": 0}, {"key": "33235855", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9621075713644606, "ground_truth": 0}, {"key": "33235855", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9728307698331013, "ground_truth": 0}, {"key": "33235855", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9394706095171265, "ground_truth": 0}, {"key": "33235855", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9697854118771184, "ground_truth": 0}, {"key": "33235855", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9553191292200677, "ground_truth": 0}, {"key": "34381016", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867746137408, "ground_truth": 0}, {"key": "34381016", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8397339583954269, "ground_truth": 0}, {"key": "34381016", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8019358176399357, "ground_truth": 0}, {"key": "34381016", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744860350449, "ground_truth": 0}, {"key": "34381016", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797709238382, "ground_truth": 0}, {"key": "28064995", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7416740166701262, "ground_truth": 0}, {"key": "28064995", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7826624812316135, "ground_truth": 0}, {"key": "28064995", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7505527717740245, "ground_truth": 0}, {"key": "28064995", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545662315376, "ground_truth": 0}, {"key": "28064995", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737930012312, "ground_truth": 0}, {"key": "37576197", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6020615992692169, "ground_truth": 0}, {"key": "37576197", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6531268947202304, "ground_truth": 0}, {"key": "37576197", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6352224399101639, "ground_truth": 0}, {"key": "37576197", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.49609382607272756, "ground_truth": 0}, {"key": "37576197", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.466845578469234, "ground_truth": 0}, {"key": "34454741", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5907791906566935, "ground_truth": 0}, {"key": "34454741", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7279754428362027, "ground_truth": 0}, {"key": "34454741", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7732163688130909, "ground_truth": 0}, {"key": "34454741", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256082136213, "ground_truth": 0}, {"key": "34454741", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228859837829, "ground_truth": 0}, {"key": "34766970", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6619228482964195, "ground_truth": 0}, {"key": "34766970", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5544704622109786, "ground_truth": 0}, {"key": "34766970", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.566018533661796, "ground_truth": 0}, {"key": "34766970", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419946933248, "ground_truth": 0}, {"key": "34766970", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366186329531, "ground_truth": 0}, {"key": "35574186", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9219218326017037, "ground_truth": 0}, {"key": "35574186", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.785308586836597, "ground_truth": 0}, {"key": "35574186", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.900529785364005, "ground_truth": 0}, {"key": "35574186", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278607487165, "ground_truth": 0}, {"key": "35574186", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338386424144, "ground_truth": 0}, {"key": "35486470", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7813306261204491, "ground_truth": 0}, {"key": "35486470", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.721743206864289, "ground_truth": 0}, {"key": "35486470", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8056321864220264, "ground_truth": 0}, {"key": "35486470", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976088768869484, "ground_truth": 0}, {"key": "35486470", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581628039228, "ground_truth": 0}, {"key": "40977702", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7879311922119752, "ground_truth": 0}, {"key": "40977702", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7549149597640615, "ground_truth": 0}, {"key": "40977702", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6808785989112828, "ground_truth": 0}, {"key": "40977702", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159745407079, "ground_truth": 0}, {"key": "40977702", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592254062576618, "ground_truth": 0}, {"key": "35336618", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7969253701295891, "ground_truth": 0}, {"key": "35336618", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7918210841585046, "ground_truth": 0}, {"key": "35336618", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8679338383166773, "ground_truth": 0}, {"key": "35336618", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711686352538, "ground_truth": 0}, {"key": "35336618", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.866132511046223, "ground_truth": 0}, {"key": "33024679", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8116760259110891, "ground_truth": 0}, {"key": "33024679", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7956580965224461, "ground_truth": 0}, {"key": "33024679", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.856812295171894, "ground_truth": 0}, {"key": "33024679", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213887959525, "ground_truth": 0}, {"key": "33024679", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578368784205, "ground_truth": 0}, {"key": "37451334", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867663542276, "ground_truth": 0}, {"key": "37451334", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7295197706470993, "ground_truth": 0}, {"key": "37451334", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8233283948370397, "ground_truth": 0}, {"key": "37451334", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867984796375, "ground_truth": 0}, {"key": "37451334", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278675853762, "ground_truth": 0}, {"key": "33354824", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.542863295655153, "ground_truth": 0}, {"key": "33354824", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6076631686519872, "ground_truth": 0}, {"key": "33354824", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.3757064479865666, "ground_truth": 0}, {"key": "33354824", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118799858571, "ground_truth": 0}, {"key": "33354824", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019530901822432, "ground_truth": 0}, {"key": "34688538", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8661325119174603, "ground_truth": 0}, {"key": "34688538", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.932943714051098, "ground_truth": 0}, {"key": "34688538", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8766343815256121, "ground_truth": 0}, {"key": "34688538", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277810109401, "ground_truth": 0}, {"key": "34688538", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867814317183, "ground_truth": 0}, {"key": "33646276", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6619228467827565, "ground_truth": 0}, {"key": "33646276", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.707404699490434, "ground_truth": 0}, {"key": "33646276", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6893056056019689, "ground_truth": 0}, {"key": "33646276", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679365956168487, "ground_truth": 0}, {"key": "33646276", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241692498484, "ground_truth": 0}, {"key": "40322608", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.855851143312331, "ground_truth": 0}, {"key": "40322608", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8705972747416196, "ground_truth": 0}, {"key": "40322608", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9319595846159245, "ground_truth": 0}, {"key": "40322608", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473671106736, "ground_truth": 0}, {"key": "40322608", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9184802521063098, "ground_truth": 0}, {"key": "39565762", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8643104566939722, "ground_truth": 0}, {"key": "39565762", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8289388160491888, "ground_truth": 0}, {"key": "39565762", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7122321676987885, "ground_truth": 0}, {"key": "39565762", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998690588001, "ground_truth": 0}, {"key": "39565762", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849495264964, "ground_truth": 0}, {"key": "30534259", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7325918420371971, "ground_truth": 0}, {"key": "30534259", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.782662476662275, "ground_truth": 0}, {"key": "30534259", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6619228740734948, "ground_truth": 0}, {"key": "30534259", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786081913886, "ground_truth": 0}, {"key": "30534259", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802706461692, "ground_truth": 0}, {"key": "39644242", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7549149846551889, "ground_truth": 0}, {"key": "39644242", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6654105388964586, "ground_truth": 0}, {"key": "39644242", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7786492975762541, "ground_truth": 0}, {"key": "39644242", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506390510186, "ground_truth": 0}, {"key": "39644242", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240958640952, "ground_truth": 0}, {"key": "19853740", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6388352940602545, "ground_truth": 0}, {"key": "19853740", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9026096038678509, "ground_truth": 0}, {"key": "19853740", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.830043760861098, "ground_truth": 0}, {"key": "19853740", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256320017508, "ground_truth": 0}, {"key": "19853740", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489721888429995, "ground_truth": 0}, {"key": "33023078", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8548846324578542, "ground_truth": 0}, {"key": "33023078", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.92840880107413, "ground_truth": 0}, {"key": "33023078", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.825589725325719, "ground_truth": 0}, {"key": "33023078", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673169472297, "ground_truth": 0}, {"key": "33023078", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748713805741, "ground_truth": 0}, {"key": "38329806", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6976089351628495, "ground_truth": 0}, {"key": "38329806", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7772998560164942, "ground_truth": 0}, {"key": "38329806", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8365545594972327, "ground_truth": 0}, {"key": "38329806", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527518675221, "ground_truth": 0}, {"key": "38329806", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.824461930654526, "ground_truth": 0}, {"key": "38761942", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6909762868180482, "ground_truth": 0}, {"key": "38761942", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9105453947628276, "ground_truth": 0}, {"key": "38761942", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7138307640766735, "ground_truth": 0}, {"key": "38761942", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.917302659254734, "ground_truth": 0}, {"key": "38761942", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199579417353, "ground_truth": 0}, {"key": "33773576", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6224593280849453, "ground_truth": 0}, {"key": "33773576", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7264256086202836, "ground_truth": 0}, {"key": "33773576", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5964331743079412, "ground_truth": 0}, {"key": "33773576", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784205935845, "ground_truth": 0}, {"key": "33773576", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460136853537517, "ground_truth": 0}, {"key": "37642631", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7217432055397667, "ground_truth": 0}, {"key": "37642631", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8606036140220744, "ground_truth": 0}, {"key": "37642631", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6723316837094402, "ground_truth": 0}, {"key": "37642631", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581605667356, "ground_truth": 0}, {"key": "37642631", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382228677124, "ground_truth": 0}, {"key": "36609836", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8723473784862433, "ground_truth": 0}, {"key": "36609836", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7879311986320677, "ground_truth": 0}, {"key": "36609836", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8198933383067906, "ground_truth": 0}, {"key": "36609836", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672256178323, "ground_truth": 0}, {"key": "36609836", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9224823366875365, "ground_truth": 0}, {"key": "41035610", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7634837662008597, "ground_truth": 0}, {"key": "41035610", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6842640181643678, "ground_truth": 0}, {"key": "41035610", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8311430472526672, "ground_truth": 0}, {"key": "41035610", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799929332119584, "ground_truth": 0}, {"key": "41035610", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.842863143443689, "ground_truth": 0}, {"key": "37592684", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6842640334698014, "ground_truth": 0}, {"key": "37592684", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8080672341223649, "ground_truth": 0}, {"key": "37592684", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8198933359244784, "ground_truth": 0}, {"key": "37592684", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789105666397, "ground_truth": 0}, {"key": "37592684", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545716533875, "ground_truth": 0}, {"key": "38951040", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8210440999583465, "ground_truth": 0}, {"key": "38951040", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6020616033834656, "ground_truth": 0}, {"key": "38951040", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7606506600187224, "ground_truth": 0}, {"key": "38951040", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760283063295, "ground_truth": 0}, {"key": "38951040", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281686804474, "ground_truth": 0}, {"key": "40774469", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "40774469", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6601723767944434, "ground_truth": 0}, {"key": "40774469", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7853085795390702, "ground_truth": 0}, {"key": "40774469", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531269363985742, "ground_truth": 0}, {"key": "40774469", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754408699126, "ground_truth": 0}, {"key": "40876288", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7490872107846361, "ground_truth": 0}, {"key": "40876288", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8140527991568216, "ground_truth": 0}, {"key": "40876288", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7879312053065695, "ground_truth": 0}, {"key": "40876288", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416491911203, "ground_truth": 0}, {"key": "40876288", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.571766635477124, "ground_truth": 0}, {"key": "40340131", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867731451331, "ground_truth": 0}, {"key": "40340131", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8092759895730419, "ground_truth": 0}, {"key": "40340131", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7676898552849373, "ground_truth": 0}, {"key": "40340131", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680324535135, "ground_truth": 0}, {"key": "40340131", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743766623603, "ground_truth": 0}, {"key": "30121591", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.819893345933153, "ground_truth": 0}, {"key": "30121591", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545635059944, "ground_truth": 0}, {"key": "30121591", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7759445666026544, "ground_truth": 0}, {"key": "30121591", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333246059863508, "ground_truth": 0}, {"key": "30121591", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772450663509, "ground_truth": 0}, {"key": "35623366", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8791467675934689, "ground_truth": 0}, {"key": "35623366", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7041601406937044, "ground_truth": 0}, {"key": "35623366", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8210441105056209, "ground_truth": 0}, {"key": "35623366", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239900641683, "ground_truth": 0}, {"key": "35623366", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998686956694, "ground_truth": 0}, {"key": "41014093", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8255897280720141, "ground_truth": 0}, {"key": "41014093", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8652240814920376, "ground_truth": 0}, {"key": "41014093", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8152324903764433, "ground_truth": 0}, {"key": "41014093", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509646952931051, "ground_truth": 0}, {"key": "41014093", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849578181442, "ground_truth": 0}, {"key": "11387984", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6636689322455084, "ground_truth": 0}, {"key": "11387984", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7008948059732582, "ground_truth": 0}, {"key": "11387984", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8509647056421529, "ground_truth": 0}, {"key": "11387984", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437677234064, "ground_truth": 0}, {"key": "11387984", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.789233683693611, "ground_truth": 0}, {"key": "39508312", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8221891439647093, "ground_truth": 0}, {"key": "39508312", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8816148975227993, "ground_truth": 0}, {"key": "39508312", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8322366825731687, "ground_truth": 0}, {"key": "39508312", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825933836186, "ground_truth": 0}, {"key": "39508312", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228337338923, "ground_truth": 0}, {"key": "35815369", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.781330620919727, "ground_truth": 0}, {"key": "35815369", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7879312031826151, "ground_truth": 0}, {"key": "35815369", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8031737932717724, "ground_truth": 0}, {"key": "35815369", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835399828746, "ground_truth": 0}, {"key": "35815369", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210602693543, "ground_truth": 0}, {"key": "35802823", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.831143034600992, "ground_truth": 0}, {"key": "35802823", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8606036306610413, "ground_truth": 0}, {"key": "35802823", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7943849524184602, "ground_truth": 0}, {"key": "35802823", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.800692012729662, "ground_truth": 0}, {"key": "35802823", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840483974756, "ground_truth": 0}, {"key": "38499968", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8606036253651675, "ground_truth": 0}, {"key": "38499968", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6001883891661656, "ground_truth": 0}, {"key": "38499968", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148278130134, "ground_truth": 0}, {"key": "38499968", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254181031195, "ground_truth": 0}, {"key": "38499968", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677545975597, "ground_truth": 0}, {"key": "36926726", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6531269279159805, "ground_truth": 0}, {"key": "36926726", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7356416240031514, "ground_truth": 0}, {"key": "36926726", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.848972207467819, "ground_truth": 0}, {"key": "36926726", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324966655939, "ground_truth": 0}, {"key": "36926726", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437644818159, "ground_truth": 0}, {"key": "40903712", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7057850380707483, "ground_truth": 0}, {"key": "40903712", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7264255911680647, "ground_truth": 0}, {"key": "40903712", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6706082557429774, "ground_truth": 0}, {"key": "40903712", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210774133627, "ground_truth": 0}, {"key": "40903712", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094570137003, "ground_truth": 0}, {"key": "19614862", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7772998639847782, "ground_truth": 0}, {"key": "19614862", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5234203440145015, "ground_truth": 0}, {"key": "19614862", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8092759866139021, "ground_truth": 0}, {"key": "19614862", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118572099496, "ground_truth": 0}, {"key": "19614862", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442250911964567, "ground_truth": 0}, {"key": "38861704", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7201715042848996, "ground_truth": 0}, {"key": "38861704", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8031737927972536, "ground_truth": 0}, {"key": "38861704", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7431680141754872, "ground_truth": 0}, {"key": "38861704", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434839498247, "ground_truth": 0}, {"key": "38861704", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336919256571, "ground_truth": 0}, {"key": "34349607", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7310585791864925, "ground_truth": 0}, {"key": "34349607", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7892336943298599, "ground_truth": 0}, {"key": "34349607", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8044059095659746, "ground_truth": 0}, {"key": "34349607", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493005778502, "ground_truth": 0}, {"key": "34349607", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358339354814, "ground_truth": 0}, {"key": "20773800", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.3775406553833348, "ground_truth": 0}, {"key": "20773800", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.45132649936735253, "ground_truth": 0}, {"key": "20773800", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.3812195730762979, "ground_truth": 0}, {"key": "20773800", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.45326185298791943, "ground_truth": 0}, {"key": "20773800", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.43590150868440886, "ground_truth": 0}, {"key": "35545608", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6584175199724311, "ground_truth": 0}, {"key": "35545608", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5583270017760671, "ground_truth": 0}, {"key": "35545608", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5409238829111854, "ground_truth": 0}, {"key": "35545608", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366316099618, "ground_truth": 0}, {"key": "35545608", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.651354851187314, "ground_truth": 0}, {"key": "37258984", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.713830754153698, "ground_truth": 0}, {"key": "37258984", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7371581561261878, "ground_truth": 0}, {"key": "37258984", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5486734860626505, "ground_truth": 0}, {"key": "37258984", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813031167055502, "ground_truth": 0}, {"key": "37258984", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269275081208, "ground_truth": 0}, {"key": "37274562", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7592254091394461, "ground_truth": 0}, {"key": "37274562", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8568123028700583, "ground_truth": 0}, {"key": "37274562", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8006920066246843, "ground_truth": 0}, {"key": "37274562", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338297373835, "ground_truth": 0}, {"key": "37274562", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897318830544, "ground_truth": 0}, {"key": "40828068", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9485372391932035, "ground_truth": 0}, {"key": "40828068", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8633916092240809, "ground_truth": 0}, {"key": "40828068", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9219218381556412, "ground_truth": 0}, {"key": "40828068", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110498640888, "ground_truth": 0}, {"key": "40828068", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8969755765423033, "ground_truth": 0}, {"key": "37807180", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8376199643826742, "ground_truth": 0}, {"key": "37807180", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8376199738333009, "ground_truth": 0}, {"key": "37807180", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.884837771132626, "ground_truth": 0}, {"key": "37807180", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9118099579077968, "ground_truth": 0}, {"key": "37807180", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9092645118690686, "ground_truth": 0}, {"key": "40748607", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9362850071940316, "ground_truth": 0}, {"key": "40748607", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9734434289785616, "ground_truth": 0}, {"key": "40748607", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9666631754916191, "ground_truth": 0}, {"key": "40748607", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9390248138662435, "ground_truth": 0}, {"key": "40748607", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9381240146168296, "ground_truth": 0}, {"key": "40123819", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8175744784137355, "ground_truth": 0}, {"key": "40123819", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7008948157214128, "ground_truth": 0}, {"key": "40123819", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8469578493140373, "ground_truth": 0}, {"key": "40123819", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920161183042, "ground_truth": 0}, {"key": "40123819", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.80927595832831, "ground_truth": 0}, {"key": "38453867", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7233094741367277, "ground_truth": 0}, {"key": "38453867", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6388352746174707, "ground_truth": 0}, {"key": "38453867", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6959583631057663, "ground_truth": 0}, {"key": "38453867", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059174762755, "ground_truth": 0}, {"key": "38453867", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191419146776, "ground_truth": 0}, {"key": "38944856", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9284088077673118, "ground_truth": 0}, {"key": "38944856", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9319595824572837, "ground_truth": 0}, {"key": "38944856", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8757869869412488, "ground_truth": 0}, {"key": "38944856", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9105453936933022, "ground_truth": 0}, {"key": "38944856", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068786311555, "ground_truth": 0}, {"key": "35778898", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9142907201539446, "ground_truth": 0}, {"key": "35778898", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8783142402721213, "ground_truth": 0}, {"key": "35778898", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7839884841789166, "ground_truth": 0}, {"key": "35778898", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343759204523, "ground_truth": 0}, {"key": "35778898", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354878014421, "ground_truth": 0}, {"key": "32530125", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6548947289699442, "ground_truth": 0}, {"key": "32530125", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7325918491509221, "ground_truth": 0}, {"key": "32530125", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6388352758893324, "ground_truth": 0}, {"key": "32530125", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118790773203, "ground_truth": 0}, {"key": "32530125", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592254055407174, "ground_truth": 0}, {"key": "35010363", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6740504522470083, "ground_truth": 0}, {"key": "35010363", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5698526290369772, "ground_truth": 0}, {"key": "35010363", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5964331293350575, "ground_truth": 0}, {"key": "35010363", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197718779831, "ground_truth": 0}, {"key": "35010363", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494539498835, "ground_truth": 0}, {"key": "27514800", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8519528054993923, "ground_truth": 0}, {"key": "27514800", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.838679739205605, "ground_truth": 0}, {"key": "27514800", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8679338361975348, "ground_truth": 0}, {"key": "27514800", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366575958847, "ground_truth": 0}, {"key": "27514800", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354864360892, "ground_truth": 0}, {"key": "25725840", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5717666098080844, "ground_truth": 0}, {"key": "25725840", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6297746232114656, "ground_truth": 0}, {"key": "25725840", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5774953684408706, "ground_truth": 0}, {"key": "25725840", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689529026306, "ground_truth": 0}, {"key": "25725840", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796906325432, "ground_truth": 0}, {"key": "38327225", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.851952810222854, "ground_truth": 0}, {"key": "38327225", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8407825750677967, "ground_truth": 0}, {"key": "38327225", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7866228432834305, "ground_truth": 0}, {"key": "38327225", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149697736691, "ground_truth": 0}, {"key": "38327225", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672180975338, "ground_truth": 0}, {"key": "11991724", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8187368017752806, "ground_truth": 0}, {"key": "11991724", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8509647094015396, "ground_truth": 0}, {"key": "11991724", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148209237921, "ground_truth": 0}, {"key": "11991724", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772364046412, "ground_truth": 0}, {"key": "11991724", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063725825939, "ground_truth": 0}, {"key": "32217545", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8056322079157964, "ground_truth": 0}, {"key": "32217545", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8969755843335809, "ground_truth": 0}, {"key": "32217545", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8749346102804196, "ground_truth": 0}, {"key": "32217545", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281508763472, "ground_truth": 0}, {"key": "32217545", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031738086705825, "ground_truth": 0}, {"key": "12731847", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7786493286156655, "ground_truth": 0}, {"key": "12731847", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.827828158520962, "ground_truth": 0}, {"key": "12731847", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6791787017053311, "ground_truth": 0}, {"key": "12731847", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936494145661, "ground_truth": 0}, {"key": "12731847", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.737158189383903, "ground_truth": 0}, {"key": "36827234", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8104789015532946, "ground_truth": 0}, {"key": "36827234", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7074046888217168, "ground_truth": 0}, {"key": "36827234", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8757870037010301, "ground_truth": 0}, {"key": "36827234", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620700919214127, "ground_truth": 0}, {"key": "36827234", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545606655997, "ground_truth": 0}, {"key": "29111539", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.769080243073115, "ground_truth": 0}, {"key": "29111539", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9046505407357824, "ground_truth": 0}, {"key": "29111539", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8740772259658721, "ground_truth": 0}, {"key": "29111539", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823380486515, "ground_truth": 0}, {"key": "29111539", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677605450248, "ground_truth": 0}, {"key": "37763052", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7295197876249047, "ground_truth": 0}, {"key": "37763052", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8376199673681117, "ground_truth": 0}, {"key": "37763052", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8311430475952218, "ground_truth": 0}, {"key": "37763052", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354911803647, "ground_truth": 0}, {"key": "37763052", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675337315917, "ground_truth": 0}, {"key": "30682335", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6671476632606483, "ground_truth": 0}, {"key": "30682335", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7690802444992866, "ground_truth": 0}, {"key": "30682335", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6992544369670527, "ground_truth": 0}, {"key": "30682335", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666463821038, "ground_truth": 0}, {"key": "30682335", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918219083736, "ground_truth": 0}, {"key": "12261276", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.32252598852378433, "ground_truth": 0}, {"key": "12261276", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5273165252060458, "ground_truth": 0}, {"key": "12261276", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.36296919759804364, "ground_truth": 0}, {"key": "12261276", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.33982761884426554, "ground_truth": 0}, {"key": "12261276", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.3174262801360907, "ground_truth": 0}, {"key": "36912979", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4921881525890687, "ground_truth": 0}, {"key": "36912979", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5945512692513051, "ground_truth": 0}, {"key": "36912979", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5039061624837676, "ground_truth": 0}, {"key": "36912979", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.39233683825592325, "ground_truth": 0}, {"key": "36912979", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557749119997966, "ground_truth": 0}, {"key": "30205259", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.907312218250586, "ground_truth": 0}, {"key": "30205259", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9416541580994676, "ground_truth": 0}, {"key": "30205259", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9263037287820394, "ground_truth": 0}, {"key": "30205259", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9241418153680102, "ground_truth": 0}, {"key": "30205259", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942241549467, "ground_truth": 0}, {"key": "39458032", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9802808719782788, "ground_truth": 0}, {"key": "39458032", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9623913656175674, "ground_truth": 0}, {"key": "39458032", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9671630446528302, "ground_truth": 0}, {"key": "39458032", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9539660963194657, "ground_truth": 0}, {"key": "39458032", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9621075740433072, "ground_truth": 0}, {"key": "35116452", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4629586146911103, "ground_truth": 0}, {"key": "35116452", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5467381681058999, "ground_truth": 0}, {"key": "35116452", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6187804204327249, "ground_truth": 0}, {"key": "35116452", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.47463118190966386, "ground_truth": 0}, {"key": "35116452", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185161902334, "ground_truth": 0}, {"key": "40107476", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867840215494, "ground_truth": 0}, {"key": "40107476", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9420819105784766, "ground_truth": 0}, {"key": "40107476", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7718434887511835, "ground_truth": 0}, {"key": "40107476", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253883054939, "ground_truth": 0}, {"key": "40107476", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918532594229, "ground_truth": 0}, {"key": "39501049", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9385759578413351, "ground_truth": 0}, {"key": "39501049", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9465966713475891, "ground_truth": 0}, {"key": "39501049", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9525741209530855, "ground_truth": 0}, {"key": "39501049", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9449947100456239, "ground_truth": 0}, {"key": "39501049", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942019048015, "ground_truth": 0}, {"key": "39642178", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5813030870785352, "ground_truth": 0}, {"key": "39642178", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7041601349804144, "ground_truth": 0}, {"key": "39642178", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7170118676911491, "ground_truth": 0}, {"key": "39642178", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640204202087, "ground_truth": 0}, {"key": "39642178", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.672331682407691, "ground_truth": 0}, {"key": "38024796", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7648916098785814, "ground_truth": 0}, {"key": "38024796", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7386690955010415, "ground_truth": 0}, {"key": "38024796", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7170118780014901, "ground_truth": 0}, {"key": "38024796", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759691990753, "ground_truth": 0}, {"key": "38024796", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020616285897488, "ground_truth": 0}, {"key": "36652079", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6460136640629299, "ground_truth": 0}, {"key": "36652079", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8418256626124458, "ground_truth": 0}, {"key": "36652079", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.731058572449998, "ground_truth": 0}, {"key": "36652079", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117843542441, "ground_truth": 0}, {"key": "36652079", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582606881736, "ground_truth": 0}, {"key": "32193402", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437719194279, "ground_truth": 0}, {"key": "32193402", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8056321833718098, "ground_truth": 0}, {"key": "32193402", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8783142468148614, "ground_truth": 0}, {"key": "32193402", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377800031051, "ground_truth": 0}, {"key": "32193402", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297976298399, "ground_truth": 0}, {"key": "32589706", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8606036129068108, "ground_truth": 0}, {"key": "32589706", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8840392890043595, "ground_truth": 0}, {"key": "32589706", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8386797600371859, "ground_truth": 0}, {"key": "32589706", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085809803849, "ground_truth": 0}, {"key": "32589706", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441113132781, "ground_truth": 0}, {"key": "38590589", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5926666196410311, "ground_truth": 0}, {"key": "38590589", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7969253774208724, "ground_truth": 0}, {"key": "38590589", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.677474018758245, "ground_truth": 0}, {"key": "38590589", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117952568549, "ground_truth": 0}, {"key": "38590589", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094540630808, "ground_truth": 0}, {"key": "37045414", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9666631746198882, "ground_truth": 0}, {"key": "37045414", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9637799467093981, "ground_truth": 0}, {"key": "37045414", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9600626825833698, "ground_truth": 0}, {"key": "37045414", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9637799424757627, "ground_truth": 0}, {"key": "37045414", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.983470444199222, "ground_truth": 0}, {"key": "33310095", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8895288538692556, "ground_truth": 0}, {"key": "33310095", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8311430572763078, "ground_truth": 0}, {"key": "33310095", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8962513756853763, "ground_truth": 0}, {"key": "33310095", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9674102558498674, "ground_truth": 0}, {"key": "33310095", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513693843692, "ground_truth": 0}, {"key": "37934604", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7704647833907606, "ground_truth": 0}, {"key": "37934604", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7981867871160617, "ground_truth": 0}, {"key": "37934604", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8152324787034237, "ground_truth": 0}, {"key": "37934604", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346279248602, "ground_truth": 0}, {"key": "37934604", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324745431007, "ground_truth": 0}, {"key": "39012181", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.990063581879805, "ground_truth": 0}, {"key": "39012181", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9742394412051436, "ground_truth": 0}, {"key": "39012181", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9796676464797252, "ground_truth": 0}, {"key": "39012181", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.987852829485346, "ground_truth": 0}, {"key": "39012181", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9874720663114513, "ground_truth": 0}, {"key": "40221674", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9039745089629829, "ground_truth": 0}, {"key": "40221674", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.905322295055803, "ground_truth": 0}, {"key": "40221674", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9372107900509377, "ground_truth": 0}, {"key": "40221674", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9086179041338425, "ground_truth": 0}, {"key": "40221674", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.949294631598518, "ground_truth": 0}, {"key": "36884862", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8056322044526648, "ground_truth": 0}, {"key": "36884862", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8732148249278588, "ground_truth": 0}, {"key": "36884862", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8816149108806308, "ground_truth": 0}, {"key": "36884862", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970744795112, "ground_truth": 0}, {"key": "36884862", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772358474168, "ground_truth": 0}, {"key": "39054429", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7248702677995268, "ground_truth": 0}, {"key": "39054429", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8910549637909502, "ground_truth": 0}, {"key": "39054429", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7476159538179746, "ground_truth": 0}, {"key": "39054429", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575449576656, "ground_truth": 0}, {"key": "39054429", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867872779176, "ground_truth": 0}, {"key": "36753964", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7745833948641698, "ground_truth": 0}, {"key": "36753964", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7356416284019902, "ground_truth": 0}, {"key": "36753964", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6619228590437244, "ground_truth": 0}, {"key": "36753964", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833947105789, "ground_truth": 0}, {"key": "36753964", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102773813401, "ground_truth": 0}, {"key": "37612459", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.890294228614213, "ground_truth": 0}, {"key": "37612459", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9167080691459247, "ground_truth": 0}, {"key": "37612459", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9230391621040439, "ground_truth": 0}, {"key": "37612459", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797066069948, "ground_truth": 0}, {"key": "37612459", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677507265929, "ground_truth": 0}, {"key": "36805789", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8848377790994293, "ground_truth": 0}, {"key": "36805789", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.969324196425886, "ground_truth": 0}, {"key": "36805789", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9284088094816974, "ground_truth": 0}, {"key": "36805789", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213782927612, "ground_truth": 0}, {"key": "36805789", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9213576155194545, "ground_truth": 0}, {"key": "12757394", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6723317023408838, "ground_truth": 0}, {"key": "12757394", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526256093437, "ground_truth": 0}, {"key": "12757394", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7620701090768096, "ground_truth": 0}, {"key": "12757394", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701053509982, "ground_truth": 0}, {"key": "12757394", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264255959438094, "ground_truth": 0}, {"key": "32192542", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9399133491736101, "ground_truth": 0}, {"key": "32192542", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9815951089998495, "ground_truth": 0}, {"key": "32192542", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9732407164481263, "ground_truth": 0}, {"key": "32192542", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942268687147, "ground_truth": 0}, {"key": "32192542", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9661559677571248, "ground_truth": 0}, {"key": "34856060", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7476159453805782, "ground_truth": 0}, {"key": "34856060", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7233094671439423, "ground_truth": 0}, {"key": "34856060", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7490872125079685, "ground_truth": 0}, {"key": "34856060", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512176839694, "ground_truth": 0}, {"key": "34856060", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935177735863, "ground_truth": 0}, {"key": "36083416", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9473810511621393, "ground_truth": 0}, {"key": "36083416", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9585377288252175, "ground_truth": 0}, {"key": "36083416", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9118099497000409, "ground_truth": 0}, {"key": "36083416", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9420819106281992, "ground_truth": 0}, {"key": "36083416", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9449947141681794, "ground_truth": 0}, {"key": "33839050", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5736783782440964, "ground_truth": 0}, {"key": "33839050", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6424324707666106, "ground_truth": 0}, {"key": "33839050", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6113819697003785, "ground_truth": 0}, {"key": "33839050", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106283160874036, "ground_truth": 0}, {"key": "33839050", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591305320644, "ground_truth": 0}, {"key": "18464690", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8428631527814046, "ground_truth": 0}, {"key": "18464690", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7606506487714779, "ground_truth": 0}, {"key": "18464690", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7931059509522188, "ground_truth": 0}, {"key": "18464690", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191265756665, "ground_truth": 0}, {"key": "18464690", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321806604638, "ground_truth": 0}, {"key": "39212665", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.3886180111459048, "ground_truth": 0}, {"key": "39212665", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.3942009658151667, "ground_truth": 0}, {"key": "39212665", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.3539863067839295, "ground_truth": 0}, {"key": "39212665", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061724241044, "ground_truth": 0}, {"key": "39212665", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.573678399109762, "ground_truth": 0}, {"key": "40094011", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8056321979315598, "ground_truth": 0}, {"key": "40094011", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6959583303974288, "ground_truth": 0}, {"key": "40094011", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7690802596726671, "ground_truth": 0}, {"key": "40094011", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303245375599, "ground_truth": 0}, {"key": "40094011", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701170306192, "ground_truth": 0}, {"key": "36036272", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7446563309292491, "ground_truth": 0}, {"key": "36036272", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7799928987741053, "ground_truth": 0}, {"key": "36036272", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7772998501750921, "ground_truth": 0}, {"key": "36036272", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.89181104195585, "ground_truth": 0}, {"key": "36036272", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303254757142, "ground_truth": 0}, {"key": "30681904", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7549150016526337, "ground_truth": 0}, {"key": "30681904", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7839884667910181, "ground_truth": 0}, {"key": "30681904", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6876299990561323, "ground_truth": 0}, {"key": "30681904", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366585817654, "ground_truth": 0}, {"key": "30681904", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737437378419, "ground_truth": 0}, {"key": "27834240", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5869964215490185, "ground_truth": 0}, {"key": "27834240", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7106283067314655, "ground_truth": 0}, {"key": "27834240", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7217432025312001, "ground_truth": 0}, {"key": "27834240", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159511294277, "ground_truth": 0}, {"key": "27834240", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241883121483, "ground_truth": 0}, {"key": "35025075", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6706082834034828, "ground_truth": 0}, {"key": "35025075", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8652240769494752, "ground_truth": 0}, {"key": "35025075", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7371581840451468, "ground_truth": 0}, {"key": "35025075", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136839694047, "ground_truth": 0}, {"key": "35025075", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575478009645, "ground_truth": 0}, {"key": "33316985", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7905303157682348, "ground_truth": 0}, {"key": "33316985", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7025300478133145, "ground_truth": 0}, {"key": "33316985", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7090191483970579, "ground_truth": 0}, {"key": "33316985", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879312013516707, "ground_truth": 0}, {"key": "33316985", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224401373977, "ground_truth": 0}, {"key": "17037056", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5698526405701773, "ground_truth": 0}, {"key": "17037056", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5563995790082237, "ground_truth": 0}, {"key": "17037056", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6876300130510762, "ground_truth": 0}, {"key": "17037056", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136977167077, "ground_truth": 0}, {"key": "17037056", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216090294466, "ground_truth": 0}, {"key": "34050457", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8661325068348268, "ground_truth": 0}, {"key": "34050457", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8910549588668677, "ground_truth": 0}, {"key": "34050457", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.926303730327162, "ground_truth": 0}, {"key": "34050457", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.853912755450927, "ground_truth": 0}, {"key": "34050457", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.924687690530038, "ground_truth": 0}, {"key": "34713745", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6513548841965124, "ground_truth": 0}, {"key": "34713745", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6601723798615726, "ground_truth": 0}, {"key": "34713745", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5602526303609584, "ground_truth": 0}, {"key": "34713745", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995632551805, "ground_truth": 0}, {"key": "34713745", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666106145453, "ground_truth": 0}, {"key": "40856210", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5389832026035772, "ground_truth": 0}, {"key": "40856210", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6242935433824225, "ground_truth": 0}, {"key": "40856210", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.4726834814658078, "ground_truth": 0}, {"key": "40856210", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926666310986075, "ground_truth": 0}, {"key": "40856210", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995931018779, "ground_truth": 0}, {"key": "40848302", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8459424456847078, "ground_truth": 0}, {"key": "40848302", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7759445467344, "ground_truth": 0}, {"key": "40848302", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8539127501409389, "ground_truth": 0}, {"key": "40848302", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916115922585, "ground_truth": 0}, {"key": "40848302", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333246188294389, "ground_truth": 0}, {"key": "40636168", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9005297957070615, "ground_truth": 0}, {"key": "40636168", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9294404038038857, "ground_truth": 0}, {"key": "40636168", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8774767791658095, "ground_truth": 0}, {"key": "40636168", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354932235085, "ground_truth": 0}, {"key": "40636168", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872045938408003, "ground_truth": 0}, {"key": "34423311", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8267117819179144, "ground_truth": 0}, {"key": "34423311", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6297746297494786, "ground_truth": 0}, {"key": "34423311", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8322366565759752, "ground_truth": 0}, {"key": "34423311", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256190444417, "ground_truth": 0}, {"key": "34423311", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943601937184, "ground_truth": 0}, {"key": "34833945", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9763105292399862, "ground_truth": 0}, {"key": "34833945", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9730365030834847, "ground_truth": 0}, {"key": "34833945", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9615338039467216, "ground_truth": 0}, {"key": "34833945", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9842154394396527, "ground_truth": 0}, {"key": "34833945", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9579122723755362, "ground_truth": 0}, {"key": "21272328", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6150878436345593, "ground_truth": 0}, {"key": "21272328", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8766343892163336, "ground_truth": 0}, {"key": "21272328", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8056321740772686, "ground_truth": 0}, {"key": "21272328", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982191542881, "ground_truth": 0}, {"key": "21272328", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575425219343, "ground_truth": 0}, {"key": "38648957", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6039318555886006, "ground_truth": 0}, {"key": "38648957", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.667147671414055, "ground_truth": 0}, {"key": "38648957", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7371581435344797, "ground_truth": 0}, {"key": "38648957", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953691622994, "ground_truth": 0}, {"key": "38648957", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358584509778, "ground_truth": 0}, {"key": "24942981", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4824291377288007, "ground_truth": 0}, {"key": "24942981", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.47268345061375394, "ground_truth": 0}, {"key": "24942981", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.46490158768528755, "ground_truth": 0}, {"key": "24942981", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199186403178, "ground_truth": 0}, {"key": "24942981", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.42250462963785484, "ground_truth": 0}, {"key": "35882366", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7248702829603367, "ground_truth": 0}, {"key": "35882366", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8933093974902758, "ground_truth": 0}, {"key": "35882366", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6279512114390173, "ground_truth": 0}, {"key": "35882366", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688444086333, "ground_truth": 0}, {"key": "35882366", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.577495376924086, "ground_truth": 0}, {"key": "40559523", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8643104616501324, "ground_truth": 0}, {"key": "40559523", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8791467781699887, "ground_truth": 0}, {"key": "40559523", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8438950996868881, "ground_truth": 0}, {"key": "40559523", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527992351335, "ground_truth": 0}, {"key": "40559523", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619201343372, "ground_truth": 0}, {"key": "24632722", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7106282995977057, "ground_truth": 0}, {"key": "24632722", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.49218810934463403, "ground_truth": 0}, {"key": "24632722", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.577495351976281, "ground_truth": 0}, {"key": "24632722", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118527080938, "ground_truth": 0}, {"key": "24632722", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.737158171115145, "ground_truth": 0}, {"key": "36002759", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6706082779864787, "ground_truth": 0}, {"key": "36002759", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.674050470471946, "ground_truth": 0}, {"key": "36002759", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6706082729713903, "ground_truth": 0}, {"key": "36002759", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.4513264840260061, "ground_truth": 0}, {"key": "36002759", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238660615965, "ground_truth": 0}, {"key": "29508534", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7931059530264302, "ground_truth": 0}, {"key": "29508534", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7248702853240722, "ground_truth": 0}, {"key": "29508534", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8006920148810939, "ground_truth": 0}, {"key": "29508534", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825738252847, "ground_truth": 0}, {"key": "29508534", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.734119541983964, "ground_truth": 0}, {"key": "15631612", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8558511608807008, "ground_truth": 0}, {"key": "15631612", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619247712639, "ground_truth": 0}, {"key": "15631612", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7956580940831959, "ground_truth": 0}, {"key": "15631612", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142483013984, "ground_truth": 0}, {"key": "15631612", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869920325718, "ground_truth": 0}, {"key": "40731892", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4551986187535714, "ground_truth": 0}, {"key": "40731892", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5312093735537897, "ground_truth": 0}, {"key": "40731892", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6859494497738321, "ground_truth": 0}, {"key": "40731892", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307615369303, "ground_truth": 0}, {"key": "40731892", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.598312213315896, "ground_truth": 0}, {"key": "35971910", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8068526292944593, "ground_truth": 0}, {"key": "35971910", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9329437155758408, "ground_truth": 0}, {"key": "35971910", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8418256474629643, "ground_truth": 0}, {"key": "35971910", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9046505383713536, "ground_truth": 0}, {"key": "35971910", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122252514867, "ground_truth": 0}, {"key": "34428424", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9579122748983022, "ground_truth": 0}, {"key": "34428424", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9348724473637425, "ground_truth": 0}, {"key": "34428424", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9661559641817673, "ground_truth": 0}, {"key": "34428424", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9651191139753046, "ground_truth": 0}, {"key": "34428424", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9763105271389155, "ground_truth": 0}, {"key": "36971005", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9612438066399689, "ground_truth": 0}, {"key": "36971005", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9416541590720813, "ground_truth": 0}, {"key": "36971005", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9353465147751673, "ground_truth": 0}, {"key": "36971005", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9294403993588493, "ground_truth": 0}, {"key": "36971005", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9453993992176067, "ground_truth": 0}, {"key": "34649067", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7106282873014488, "ground_truth": 0}, {"key": "34649067", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.709019136234303, "ground_truth": 0}, {"key": "34649067", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7201715141993514, "ground_truth": 0}, {"key": "34649067", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876300084599667, "ground_truth": 0}, {"key": "34649067", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867813452173, "ground_truth": 0}, {"key": "37355154", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7745833820057579, "ground_truth": 0}, {"key": "37355154", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7931059511707204, "ground_truth": 0}, {"key": "37355154", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148292538047, "ground_truth": 0}, {"key": "37355154", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.783988461742308, "ground_truth": 0}, {"key": "37355154", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802429959078, "ground_truth": 0}, {"key": "38674697", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8152324893466164, "ground_truth": 0}, {"key": "38674697", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.627951231490191, "ground_truth": 0}, {"key": "38674697", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6513548554937276, "ground_truth": 0}, {"key": "38674697", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689519090198, "ground_truth": 0}, {"key": "38674697", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423209330392, "ground_truth": 0}, {"key": "40525767", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9724147165543486, "ground_truth": 0}, {"key": "40525767", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9791955099600731, "ground_truth": 0}, {"key": "40525767", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9582261219702787, "ground_truth": 0}, {"key": "40525767", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9621075728937344, "ground_truth": 0}, {"key": "40525767", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9390248180678163, "ground_truth": 0}, {"key": "27165110", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.626124143423445, "ground_truth": 0}, {"key": "27165110", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.41300357664606585, "ground_truth": 0}, {"key": "27165110", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5869964426275648, "ground_truth": 0}, {"key": "27165110", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563288619635, "ground_truth": 0}, {"key": "27165110", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926666055570966, "ground_truth": 0}, {"key": "35497491", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7956580825381249, "ground_truth": 0}, {"key": "35497491", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8418256450006008, "ground_truth": 0}, {"key": "35497491", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.764891625006988, "ground_truth": 0}, {"key": "35497491", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619371696535, "ground_truth": 0}, {"key": "35497491", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.86246752828908, "ground_truth": 0}, {"key": "40690716", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8233283940328308, "ground_truth": 0}, {"key": "40690716", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.869714583113189, "ground_truth": 0}, {"key": "40690716", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9284087931516114, "ground_truth": 0}, {"key": "40690716", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923189507284, "ground_truth": 0}, {"key": "40690716", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9518632321496227, "ground_truth": 0}, {"key": "34835193", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9790357584694748, "ground_truth": 0}, {"key": "34835193", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9828232916401053, "ground_truth": 0}, {"key": "34835193", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9706877703839648, "ground_truth": 0}, {"key": "34835193", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9780517480757328, "ground_truth": 0}, {"key": "34835193", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9669140206935771, "ground_truth": 0}, {"key": "39471712", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6150878507241877, "ground_truth": 0}, {"key": "39471712", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7772998464760371, "ground_truth": 0}, {"key": "39471712", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7772998586930676, "ground_truth": 0}, {"key": "39471712", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358449749959, "ground_truth": 0}, {"key": "39471712", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620700942392384, "ground_truth": 0}, {"key": "39115192", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.904650536735376, "ground_truth": 0}, {"key": "39115192", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9053222975182852, "ground_truth": 0}, {"key": "39115192", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8519527878052765, "ground_truth": 0}, {"key": "39115192", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085761582176, "ground_truth": 0}, {"key": "39115192", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673006442095, "ground_truth": 0}, {"key": "23520673", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.43398147273755916, "ground_truth": 0}, {"key": "23520673", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5602526446744762, "ground_truth": 0}, {"key": "23520673", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5832033640869387, "ground_truth": 0}, {"key": "23520673", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666157216696, "ground_truth": 0}, {"key": "23520673", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420094840026737, "ground_truth": 0}, {"key": "35764233", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6150878505568713, "ground_truth": 0}, {"key": "35764233", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8652240767186649, "ground_truth": 0}, {"key": "35764233", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7386690707084003, "ground_truth": 0}, {"key": "35764233", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837586796033, "ground_truth": 0}, {"key": "35764233", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833779095485, "ground_truth": 0}, {"key": "35228910", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6442251145452033, "ground_truth": 0}, {"key": "35228910", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6774739994774949, "ground_truth": 0}, {"key": "35228910", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.48438009426121587, "ground_truth": 0}, {"key": "35228910", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494483943913, "ground_truth": 0}, {"key": "35228910", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.569852633501937, "ground_truth": 0}, {"key": "36795599", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9372107918336121, "ground_truth": 0}, {"key": "36795599", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9504109791261083, "ground_truth": 0}, {"key": "36795599", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9658995710650875, "ground_truth": 0}, {"key": "36795599", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9376689618861738, "ground_truth": 0}, {"key": "36795599", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9407897486169065, "ground_truth": 0}, {"key": "38641949", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7931059524452942, "ground_truth": 0}, {"key": "38641949", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8233284012836027, "ground_truth": 0}, {"key": "38641949", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.814052828200455, "ground_truth": 0}, {"key": "38641949", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549150070982236, "ground_truth": 0}, {"key": "38641949", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891394889502, "ground_truth": 0}, {"key": "29968443", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9136765280773937, "ground_truth": 0}, {"key": "29968443", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9252299575500281, "ground_truth": 0}, {"key": "29968443", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9224823431974454, "ground_truth": 0}, {"key": "29968443", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359901187473, "ground_truth": 0}, {"key": "29968443", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923134904332, "ground_truth": 0}, {"key": "21268042", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6442251174726009, "ground_truth": 0}, {"key": "21268042", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7799928948699658, "ground_truth": 0}, {"key": "21268042", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6825737451041285, "ground_truth": 0}, {"key": "21268042", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952983713786, "ground_truth": 0}, {"key": "21268042", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.771843504393148, "ground_truth": 0}, {"key": "26808572", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.831143057605258, "ground_truth": 0}, {"key": "26808572", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7505527721470998, "ground_truth": 0}, {"key": "26808572", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8031737987515759, "ground_truth": 0}, {"key": "26808572", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867723943308, "ground_truth": 0}, {"key": "26808572", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324759391757, "ground_truth": 0}, {"key": "37829390", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7534666464656655, "ground_truth": 0}, {"key": "37829390", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8031737905206945, "ground_truth": 0}, {"key": "37829390", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8887587923060112, "ground_truth": 0}, {"key": "37829390", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620700962604288, "ground_truth": 0}, {"key": "37829390", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354831652878, "ground_truth": 0}, {"key": "35716045", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.847967762497393, "ground_truth": 0}, {"key": "35716045", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.831143053602484, "ground_truth": 0}, {"key": "35716045", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.846957844522692, "ground_truth": 0}, {"key": "35716045", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933266164887, "ground_truth": 0}, {"key": "35716045", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339665747483, "ground_truth": 0}, {"key": "34367070", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9324533080841632, "ground_truth": 0}, {"key": "34367070", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9412234448228644, "ground_truth": 0}, {"key": "34367070", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9661559676298276, "ground_truth": 0}, {"key": "34367070", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942177106069, "ground_truth": 0}, {"key": "34367070", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.94659667035457, "ground_truth": 0}, {"key": "35239748", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8774767947968363, "ground_truth": 0}, {"key": "35239748", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8643104444752167, "ground_truth": 0}, {"key": "35239748", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.890294227655686, "ground_truth": 0}, {"key": "35239748", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281665641101, "ground_truth": 0}, {"key": "35239748", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9079671415090446, "ground_truth": 0}, {"key": "40421370", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7853085872185207, "ground_truth": 0}, {"key": "40421370", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7185943857098954, "ground_truth": 0}, {"key": "40421370", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7356416691990261, "ground_truth": 0}, {"key": "40421370", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106282776452274, "ground_truth": 0}, {"key": "40421370", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544195525265, "ground_truth": 0}, {"key": "37288396", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9190632962787466, "ground_truth": 0}, {"key": "37288396", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7648916189086943, "ground_truth": 0}, {"key": "37288396", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8984105687804476, "ground_truth": 0}, {"key": "37288396", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998593134939, "ground_truth": 0}, {"key": "37288396", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759735391033, "ground_truth": 0}, {"key": "38903688", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8459424289793311, "ground_truth": 0}, {"key": "38903688", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9358173615230131, "ground_truth": 0}, {"key": "38903688", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8848377701028599, "ground_truth": 0}, {"key": "38903688", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145775226188, "ground_truth": 0}, {"key": "38903688", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647181219943, "ground_truth": 0}, {"key": "28071228", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9213576176698324, "ground_truth": 0}, {"key": "28071228", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9257686316523284, "ground_truth": 0}, {"key": "28071228", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9433475702776681, "ground_truth": 0}, {"key": "28071228", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9039745102740064, "ground_truth": 0}, {"key": "28071228", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549501320503, "ground_truth": 0}, {"key": "36855834", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7969253709598262, "ground_truth": 0}, {"key": "36855834", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8278281516175144, "ground_truth": 0}, {"key": "36855834", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7772998491364033, "ground_truth": 0}, {"key": "36855834", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.921921834221616, "ground_truth": 0}, {"key": "36855834", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278620411665, "ground_truth": 0}, {"key": "40548717", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6076631684035118, "ground_truth": 0}, {"key": "40548717", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7461390029352984, "ground_truth": 0}, {"key": "40548717", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7217432079321501, "ground_truth": 0}, {"key": "40548717", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585543967788, "ground_truth": 0}, {"key": "40548717", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366011805145, "ground_truth": 0}, {"key": "37051175", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7371581556813821, "ground_truth": 0}, {"key": "37051175", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8519528108379818, "ground_truth": 0}, {"key": "37051175", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.49804687640886824, "ground_truth": 0}, {"key": "37051175", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.677474018368217, "ground_truth": 0}, {"key": "37051175", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441148798744, "ground_truth": 0}, {"key": "38882119", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.858718589722661, "ground_truth": 0}, {"key": "38882119", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7690802316555917, "ground_truth": 0}, {"key": "38882119", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8068526388369418, "ground_truth": 0}, {"key": "38882119", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354755091141, "ground_truth": 0}, {"key": "38882119", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575816597509, "ground_truth": 0}, {"key": "19485402", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7431679985441675, "ground_truth": 0}, {"key": "19485402", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6424324485531081, "ground_truth": 0}, {"key": "19485402", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8624675266213613, "ground_truth": 0}, {"key": "19485402", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744747857833, "ground_truth": 0}, {"key": "19485402", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.713830771306965, "ground_truth": 0}, {"key": "36060907", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9207896778855728, "ground_truth": 0}, {"key": "36060907", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9111797092252851, "ground_truth": 0}, {"key": "36060907", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9559813469346096, "ground_truth": 0}, {"key": "36060907", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9525741289943516, "ground_truth": 0}, {"key": "36060907", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277709571507, "ground_truth": 0}, {"key": "24037309", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.93812401563031, "ground_truth": 0}, {"key": "24037309", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9556514189217183, "ground_truth": 0}, {"key": "24037309", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9539660993739401, "ground_truth": 0}, {"key": "24037309", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9706877694441403, "ground_truth": 0}, {"key": "24037309", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9518632291348331, "ground_truth": 0}, {"key": "35605805", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7826624768716797, "ground_truth": 0}, {"key": "35605805", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8006920005539884, "ground_truth": 0}, {"key": "35605805", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7813306272346943, "ground_truth": 0}, {"key": "35605805", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357581603491, "ground_truth": 0}, {"key": "35605805", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245958839894, "ground_truth": 0}, {"key": "17706248", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7918210711541347, "ground_truth": 0}, {"key": "17706248", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.795658098692447, "ground_truth": 0}, {"key": "17706248", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7057850322146842, "ground_truth": 0}, {"key": "17706248", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210574964283, "ground_truth": 0}, {"key": "17706248", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878397450443, "ground_truth": 0}, {"key": "36883559", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8333245973056134, "ground_truth": 0}, {"key": "36883559", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8116760237452738, "ground_truth": 0}, {"key": "36883559", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7918210627219002, "ground_truth": 0}, {"key": "36883559", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8955226748862131, "ground_truth": 0}, {"key": "36883559", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970752663067, "ground_truth": 0}, {"key": "32799471", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8740772258624245, "ground_truth": 0}, {"key": "32799471", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8104789125788713, "ground_truth": 0}, {"key": "32799471", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7401743611298849, "ground_truth": 0}, {"key": "32799471", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.731058592102849, "ground_truth": 0}, {"key": "32799471", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366486195636, "ground_truth": 0}, {"key": "34797243", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6315942891424465, "ground_truth": 0}, {"key": "34797243", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7310585699202122, "ground_truth": 0}, {"key": "34797243", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.771843505730851, "ground_truth": 0}, {"key": "34797243", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228750431118, "ground_truth": 0}, {"key": "34797243", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943689138915, "ground_truth": 0}, {"key": "32154876", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.679178694076731, "ground_truth": 0}, {"key": "32154876", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619361008056, "ground_truth": 0}, {"key": "32154876", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7476159617497653, "ground_truth": 0}, {"key": "32154876", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102699708227, "ground_truth": 0}, {"key": "32154876", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228598399161, "ground_truth": 0}, {"key": "37962274", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7325918507716452, "ground_truth": 0}, {"key": "37962274", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7534666567098757, "ground_truth": 0}, {"key": "37962274", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7879311791717856, "ground_truth": 0}, {"key": "37962274", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191427738485, "ground_truth": 0}, {"key": "37962274", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424279587137, "ground_truth": 0}, {"key": "35574030", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8925625133136139, "ground_truth": 0}, {"key": "35574030", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8856314647885764, "ground_truth": 0}, {"key": "35574030", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9304582645031229, "ground_truth": 0}, {"key": "35574030", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748623763081, "ground_truth": 0}, {"key": "35574030", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8783142392444707, "ground_truth": 0}, {"key": "39105949", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9246876882844692, "ground_truth": 0}, {"key": "39105949", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9299510383216255, "ground_truth": 0}, {"key": "39105949", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8879840464519766, "ground_truth": 0}, {"key": "39105949", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213760355764, "ground_truth": 0}, {"key": "39105949", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869825887956, "ground_truth": 0}, {"key": "41064322", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9289263314519216, "ground_truth": 0}, {"key": "41064322", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9319595823086445, "ground_truth": 0}, {"key": "41064322", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9473810506298018, "ground_truth": 0}, {"key": "41064322", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9566342000070935, "ground_truth": 0}, {"key": "41064322", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9314624991578814, "ground_truth": 0}, {"key": "28105101", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7549149773317678, "ground_truth": 0}, {"key": "28105101", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8210441043358697, "ground_truth": 0}, {"key": "28105101", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7956580988659201, "ground_truth": 0}, {"key": "28105101", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224228631356, "ground_truth": 0}, {"key": "28105101", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358140921279, "ground_truth": 0}, {"key": "36036068", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6723316964825298, "ground_truth": 0}, {"key": "36036068", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8080672280682185, "ground_truth": 0}, {"key": "36036068", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8300437771229124, "ground_truth": 0}, {"key": "36036068", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.82782814777252, "ground_truth": 0}, {"key": "36036068", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879312037520451, "ground_truth": 0}, {"key": "37991460", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.803173784405891, "ground_truth": 0}, {"key": "37991460", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8587185776538919, "ground_truth": 0}, {"key": "37991460", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8044059131215331, "ground_truth": 0}, {"key": "37991460", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199697227891, "ground_truth": 0}, {"key": "37991460", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8783142480319005, "ground_truth": 0}, {"key": "38437830", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7826624769887579, "ground_truth": 0}, {"key": "38437830", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7592253960131136, "ground_truth": 0}, {"key": "38437830", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8529354746659595, "ground_truth": 0}, {"key": "38437830", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388086628307, "ground_truth": 0}, {"key": "38437830", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269253127365, "ground_truth": 0}, {"key": "36507138", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7956581005004882, "ground_truth": 0}, {"key": "36507138", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6909762776320205, "ground_truth": 0}, {"key": "36507138", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6619228605423421, "ground_truth": 0}, {"key": "36507138", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905302969067661, "ground_truth": 0}, {"key": "36507138", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445663250755, "ground_truth": 0}, {"key": "37824866", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8872045905353594, "ground_truth": 0}, {"key": "37824866", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.811676032711803, "ground_truth": 0}, {"key": "37824866", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7704647687670696, "ground_truth": 0}, {"key": "37824866", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438951035064313, "ground_truth": 0}, {"key": "37824866", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918344186834, "ground_truth": 0}, {"key": "25088134", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7620701058256261, "ground_truth": 0}, {"key": "25088134", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8187367977586456, "ground_truth": 0}, {"key": "25088134", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8221891516125333, "ground_truth": 0}, {"key": "25088134", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549150113647232, "ground_truth": 0}, {"key": "25088134", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578366275797, "ground_truth": 0}, {"key": "40172531", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7704647673031649, "ground_truth": 0}, {"key": "40172531", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7634837384376711, "ground_truth": 0}, {"key": "40172531", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8006920116870266, "ground_truth": 0}, {"key": "40172531", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581531631672, "ground_truth": 0}, {"key": "40172531", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.749087187960653, "ground_truth": 0}, {"key": "37035874", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7122321852503257, "ground_truth": 0}, {"key": "37035874", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7648916158508581, "ground_truth": 0}, {"key": "37035874", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7592253957847381, "ground_truth": 0}, {"key": "37035874", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191343660603, "ground_truth": 0}, {"key": "37035874", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743410326089, "ground_truth": 0}, {"key": "36404465", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9563089421903082, "ground_truth": 0}, {"key": "36404465", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9676556712424788, "ground_truth": 0}, {"key": "36404465", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9623913649193897, "ground_truth": 0}, {"key": "36404465", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.977370798442991, "ground_truth": 0}, {"key": "36404465", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9746286888088643, "ground_truth": 0}, {"key": "39602052", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8529354875597634, "ground_truth": 0}, {"key": "39602052", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9196425324805797, "ground_truth": 0}, {"key": "39602052", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8807970686813403, "ground_truth": 0}, {"key": "39602052", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577680974914653, "ground_truth": 0}, {"key": "39602052", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549517561129, "ground_truth": 0}, {"key": "33792789", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6001883540553153, "ground_truth": 0}, {"key": "33792789", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5525397055803036, "ground_truth": 0}, {"key": "33792789", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7905303049624328, "ground_truth": 0}, {"key": "33792789", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197805357726, "ground_truth": 0}, {"key": "33792789", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723672252112, "ground_truth": 0}, {"key": "32776626", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6495786308884959, "ground_truth": 0}, {"key": "32776626", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8187367934910865, "ground_truth": 0}, {"key": "32776626", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6297746255101436, "ground_truth": 0}, {"key": "32776626", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033778000768, "ground_truth": 0}, {"key": "32776626", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984906162673, "ground_truth": 0}, {"key": "37195090", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7759445561227599, "ground_truth": 0}, {"key": "37195090", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8140528133112814, "ground_truth": 0}, {"key": "37195090", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6757645935322988, "ground_truth": 0}, {"key": "37195090", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432112579704, "ground_truth": 0}, {"key": "37195090", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786324419049, "ground_truth": 0}, {"key": "33981824", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7759445291897374, "ground_truth": 0}, {"key": "33981824", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6654105576331698, "ground_truth": 0}, {"key": "33981824", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5525397038984802, "ground_truth": 0}, {"key": "33981824", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.766293656446419, "ground_truth": 0}, {"key": "33981824", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046833109543, "ground_truth": 0}, {"key": "39569142", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7690802347766826, "ground_truth": 0}, {"key": "39569142", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8056321748252144, "ground_truth": 0}, {"key": "39569142", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8092759774154736, "ground_truth": 0}, {"key": "39569142", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575530202667, "ground_truth": 0}, {"key": "39569142", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197792115306, "ground_truth": 0}, {"key": "40268210", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7718434877931688, "ground_truth": 0}, {"key": "40268210", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6909763161201941, "ground_truth": 0}, {"key": "40268210", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8633916077160271, "ground_truth": 0}, {"key": "40268210", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587859856899, "ground_truth": 0}, {"key": "40268210", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.757794382854248, "ground_truth": 0}, {"key": "34925159", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8386797675215619, "ground_truth": 0}, {"key": "34925159", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7248702834072649, "ground_truth": 0}, {"key": "34925159", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7534666488165045, "ground_truth": 0}, {"key": "34925159", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.903974507356147, "ground_truth": 0}, {"key": "34925159", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357564916565, "ground_truth": 0}, {"key": "36181903", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9053223028561027, "ground_truth": 0}, {"key": "36181903", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.937668965052894, "ground_truth": 0}, {"key": "36181903", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9416541596301907, "ground_truth": 0}, {"key": "36181903", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9167080819017437, "ground_truth": 0}, {"key": "36181903", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105516152076, "ground_truth": 0}, {"key": "38620559", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9515039963720933, "ground_truth": 0}, {"key": "38620559", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9257686325458852, "ground_truth": 0}, {"key": "38620559", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8984105497720876, "ground_truth": 0}, {"key": "38620559", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9149009580464956, "ground_truth": 0}, {"key": "38620559", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8969755740724835, "ground_truth": 0}, {"key": "32719657", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8902942280665183, "ground_truth": 0}, {"key": "32719657", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.917893367841895, "ground_truth": 0}, {"key": "32719657", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8596637551023255, "ground_truth": 0}, {"key": "32719657", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711759213562, "ground_truth": 0}, {"key": "32719657", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789155844593, "ground_truth": 0}, {"key": "37530914", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6513548628482239, "ground_truth": 0}, {"key": "37530914", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5156199305428257, "ground_truth": 0}, {"key": "37530914", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.523420369863903, "ground_truth": 0}, {"key": "37530914", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254160729925, "ground_truth": 0}, {"key": "37530914", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318419099337, "ground_truth": 0}, {"key": "33306933", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7905303325608559, "ground_truth": 0}, {"key": "33306933", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8879840379965083, "ground_truth": 0}, {"key": "33306933", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9273632924225846, "ground_truth": 0}, {"key": "33306933", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354961135135, "ground_truth": 0}, {"key": "33306933", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9105453943900004, "ground_truth": 0}, {"key": "33837212", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.783988458772015, "ground_truth": 0}, {"key": "33837212", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431680106867875, "ground_truth": 0}, {"key": "33837212", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7648916088219259, "ground_truth": 0}, {"key": "33837212", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545571269272, "ground_truth": 0}, {"key": "33837212", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.778649322821144, "ground_truth": 0}, {"key": "40945179", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228532530104, "ground_truth": 0}, {"key": "40945179", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7931059404264984, "ground_truth": 0}, {"key": "40945179", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.845942441428205, "ground_truth": 0}, {"key": "40945179", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366569372961, "ground_truth": 0}, {"key": "40945179", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338506880432, "ground_truth": 0}, {"key": "34152358", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6566582639382543, "ground_truth": 0}, {"key": "34152358", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5794004300155003, "ground_truth": 0}, {"key": "34152358", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.4493925895805129, "ground_truth": 0}, {"key": "34152358", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165294933594, "ground_truth": 0}, {"key": "34152358", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.635222447618525, "ground_truth": 0}, {"key": "34136541", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.902609599294636, "ground_truth": 0}, {"key": "34136541", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8643104521206411, "ground_truth": 0}, {"key": "34136541", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8300437673474554, "ground_truth": 0}, {"key": "34136541", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9026096012990925, "ground_truth": 0}, {"key": "34136541", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816148999597844, "ground_truth": 0}, {"key": "37469603", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7772998673380871, "ground_truth": 0}, {"key": "37469603", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7879311997148823, "ground_truth": 0}, {"key": "37469603", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.812867325021373, "ground_truth": 0}, {"key": "37469603", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063890059962, "ground_truth": 0}, {"key": "37469603", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068857442022, "ground_truth": 0}, {"key": "37353611", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9722043776198195, "ground_truth": 0}, {"key": "37353611", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9465966730345172, "ground_truth": 0}, {"key": "37353611", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9190632874900139, "ground_truth": 0}, {"key": "37353611", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037287242285, "ground_truth": 0}, {"key": "37353611", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9092645080912206, "ground_truth": 0}, {"key": "37211649", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6513548944009888, "ground_truth": 0}, {"key": "37211649", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526384446759, "ground_truth": 0}, {"key": "37211649", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8210441204731326, "ground_truth": 0}, {"key": "37211649", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943723817487, "ground_truth": 0}, {"key": "37211649", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.734119531637964, "ground_truth": 0}, {"key": "37320976", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7074047218223609, "ground_truth": 0}, {"key": "37320976", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.697608938867278, "ground_truth": 0}, {"key": "37320976", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7386690732645379, "ground_truth": 0}, {"key": "37320976", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253735993546, "ground_truth": 0}, {"key": "37320976", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056236187258, "ground_truth": 0}, {"key": "34492412", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.924687694583616, "ground_truth": 0}, {"key": "34492412", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8459424438254626, "ground_truth": 0}, {"key": "34492412", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9032942227666608, "ground_truth": 0}, {"key": "34492412", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.899827779596734, "ground_truth": 0}, {"key": "34492412", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338456198284, "ground_truth": 0}, {"key": "36655016", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9412234382444216, "ground_truth": 0}, {"key": "36655016", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9496693660501265, "ground_truth": 0}, {"key": "36655016", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9343951550376371, "ground_truth": 0}, {"key": "36655016", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.966155964477551, "ground_truth": 0}, {"key": "36655016", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9458012634171157, "ground_truth": 0}, {"key": "35220773", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8661325184636253, "ground_truth": 0}, {"key": "35220773", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7620701264696343, "ground_truth": 0}, {"key": "35220773", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8624675428157078, "ground_truth": 0}, {"key": "35220773", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846340723959, "ground_truth": 0}, {"key": "35220773", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942030428485, "ground_truth": 0}, {"key": "31569808", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7476159549958077, "ground_truth": 0}, {"key": "31569808", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7505527675573389, "ground_truth": 0}, {"key": "31569808", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6531269201621634, "ground_truth": 0}, {"key": "31569808", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486735086742173, "ground_truth": 0}, {"key": "31569808", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.77046478729201, "ground_truth": 0}, {"key": "37696256", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7185943966754561, "ground_truth": 0}, {"key": "37696256", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267118015568561, "ground_truth": 0}, {"key": "37696256", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7969253689126121, "ground_truth": 0}, {"key": "37696256", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059122719424, "ground_truth": 0}, {"key": "37696256", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916137468587, "ground_truth": 0}, {"key": "36874328", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8267118095063506, "ground_truth": 0}, {"key": "36874328", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8489722105064391, "ground_truth": 0}, {"key": "36874328", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8652240871763596, "ground_truth": 0}, {"key": "36874328", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361618115032, "ground_truth": 0}, {"key": "36874328", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923147626717, "ground_truth": 0}, {"key": "24532377", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8140528154358047, "ground_truth": 0}, {"key": "24532377", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8175744691899901, "ground_truth": 0}, {"key": "24532377", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.851952786313534, "ground_truth": 0}, {"key": "24532377", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933169333412, "ground_truth": 0}, {"key": "24532377", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933361290532, "ground_truth": 0}, {"key": "39560618", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7476159445649037, "ground_truth": 0}, {"key": "39560618", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8255897115683741, "ground_truth": 0}, {"key": "39560618", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8152324910930231, "ground_truth": 0}, {"key": "39560618", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879312051348136, "ground_truth": 0}, {"key": "39560618", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382130174157, "ground_truth": 0}, {"key": "34922693", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.3867634456046159, "ground_truth": 0}, {"key": "34922693", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.4863315317875518, "ground_truth": 0}, {"key": "34922693", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5019531062834588, "ground_truth": 0}, {"key": "34922693", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.33982761687723906, "ground_truth": 0}, {"key": "34922693", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754067429270427, "ground_truth": 0}, {"key": "33629577", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6584175003915645, "ground_truth": 0}, {"key": "33629577", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6992544105151085, "ground_truth": 0}, {"key": "33629577", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8344068799082521, "ground_truth": 0}, {"key": "33629577", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228669559295, "ground_truth": 0}, {"key": "33629577", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217431944349294, "ground_truth": 0}, {"key": "32284359", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7371581808023282, "ground_truth": 0}, {"key": "32284359", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7057850295683813, "ground_truth": 0}, {"key": "32284359", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7217432344518424, "ground_truth": 0}, {"key": "32284359", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646216849448, "ground_truth": 0}, {"key": "32284359", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.684264030405894, "ground_truth": 0}, {"key": "28082962", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7461390142767069, "ground_truth": 0}, {"key": "28082962", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5851011797287692, "ground_truth": 0}, {"key": "28082962", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7676898537674918, "ground_truth": 0}, {"key": "28082962", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338511599906, "ground_truth": 0}, {"key": "28082962", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352919492013, "ground_truth": 0}, {"key": "24796803", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9118099650015533, "ground_truth": 0}, {"key": "24796803", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9500414751784778, "ground_truth": 0}, {"key": "24796803", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8774767843721352, "ground_truth": 0}, {"key": "24796803", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9385759622587904, "ground_truth": 0}, {"key": "24796803", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037297640484, "ground_truth": 0}, {"key": "35466150", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8783142454329433, "ground_truth": 0}, {"key": "35466150", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8933093962529898, "ground_truth": 0}, {"key": "35466150", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9504109792328481, "ground_truth": 0}, {"key": "35466150", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.874077238608128, "ground_truth": 0}, {"key": "35466150", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145701770714, "ground_truth": 0}, {"key": "35754289", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8940517233803144, "ground_truth": 0}, {"key": "35754289", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9019206698197417, "ground_truth": 0}, {"key": "35754289", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8887587958395857, "ground_truth": 0}, {"key": "35754289", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835389620263, "ground_truth": 0}, {"key": "35754289", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445521739823, "ground_truth": 0}, {"key": "36678662", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9643214471195678, "ground_truth": 0}, {"key": "36678662", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9612438042919095, "ground_truth": 0}, {"key": "36678662", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8840392950770236, "ground_truth": 0}, {"key": "36678662", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9525741284872744, "ground_truth": 0}, {"key": "36678662", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346212415237, "ground_truth": 0}, {"key": "35399671", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9257686325051179, "ground_truth": 0}, {"key": "35399671", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9219218333005453, "ground_truth": 0}, {"key": "35399671", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8955226694814039, "ground_truth": 0}, {"key": "35399671", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9149009552159565, "ground_truth": 0}, {"key": "35399671", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.876634387375859, "ground_truth": 0}, {"key": "36888180", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.871474860099978, "ground_truth": 0}, {"key": "36888180", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8255897096457069, "ground_truth": 0}, {"key": "36888180", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8386797677113144, "ground_truth": 0}, {"key": "36888180", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519527998377181, "ground_truth": 0}, {"key": "36888180", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9105453926421407, "ground_truth": 0}, {"key": "28061069", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6548947212209062, "ground_truth": 0}, {"key": "28061069", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7799929109168623, "ground_truth": 0}, {"key": "28061069", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7918210595135626, "ground_truth": 0}, {"key": "28061069", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506631751584, "ground_truth": 0}, {"key": "28061069", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442251160064919, "ground_truth": 0}, {"key": "22259982", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7905303036133254, "ground_truth": 0}, {"key": "22259982", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.749087219657706, "ground_truth": 0}, {"key": "22259982", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7264256051806256, "ground_truth": 0}, {"key": "22259982", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926665944132746, "ground_truth": 0}, {"key": "22259982", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358115923002, "ground_truth": 0}, {"key": "34026805", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8322366576235091, "ground_truth": 0}, {"key": "34026805", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8791467709024545, "ground_truth": 0}, {"key": "34026805", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.877476796979549, "ground_truth": 0}, {"key": "34026805", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354822881197, "ground_truth": 0}, {"key": "34026805", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297877826317, "ground_truth": 0}, {"key": "36713809", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7356416299365949, "ground_truth": 0}, {"key": "36713809", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8056321762629451, "ground_truth": 0}, {"key": "36713809", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8376199575216006, "ground_truth": 0}, {"key": "36713809", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358246619466, "ground_truth": 0}, {"key": "36713809", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9246876964683445, "ground_truth": 0}, {"key": "39726411", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6495786001153048, "ground_truth": 0}, {"key": "39726411", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7690802369986229, "ground_truth": 0}, {"key": "39726411", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6261241636461632, "ground_truth": 0}, {"key": "39726411", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082639487512, "ground_truth": 0}, {"key": "39726411", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646064464189, "ground_truth": 0}, {"key": "37069841", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.866132508544006, "ground_truth": 0}, {"key": "37069841", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8991213706975216, "ground_truth": 0}, {"key": "37069841", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8449215348910549, "ground_truth": 0}, {"key": "37069841", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430599192478, "ground_truth": 0}, {"key": "37069841", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9039745239642683, "ground_truth": 0}, {"key": "38894693", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6636689424285318, "ground_truth": 0}, {"key": "38894693", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.787931192244068, "ground_truth": 0}, {"key": "38894693", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.726425628067101, "ground_truth": 0}, {"key": "38894693", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526198827254, "ground_truth": 0}, {"key": "38894693", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884659482295, "ground_truth": 0}, {"key": "33946032", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9755769108963976, "ground_truth": 0}, {"key": "33946032", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9606574986516458, "ground_truth": 0}, {"key": "33946032", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.955981353081313, "ground_truth": 0}, {"key": "33946032", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9600626876976713, "ground_truth": 0}, {"key": "33946032", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.960951703397902, "ground_truth": 0}, {"key": "39035311", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9420819137303668, "ground_truth": 0}, {"key": "39035311", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9473810480335373, "ground_truth": 0}, {"key": "39035311", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9348724537055705, "ground_truth": 0}, {"key": "39035311", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952986806609, "ground_truth": 0}, {"key": "39035311", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9304582573498684, "ground_truth": 0}, {"key": "27680038", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6566582838761499, "ground_truth": 0}, {"key": "27680038", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6531269318624086, "ground_truth": 0}, {"key": "27680038", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6020615940769967, "ground_truth": 0}, {"key": "27680038", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241893617983, "ground_truth": 0}, {"key": "27680038", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203663753115, "ground_truth": 0}, {"key": "36901907", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8998277755298516, "ground_truth": 0}, {"key": "36901907", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8044059041484355, "ground_truth": 0}, {"key": "36901907", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8128673124505119, "ground_truth": 0}, {"key": "36901907", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866227974557559, "ground_truth": 0}, {"key": "36901907", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070037889176, "ground_truth": 0}, {"key": "21530542", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5486734971921321, "ground_truth": 0}, {"key": "21530542", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.747615958561555, "ground_truth": 0}, {"key": "21530542", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6406358587697676, "ground_truth": 0}, {"key": "21530542", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251248590729, "ground_truth": 0}, {"key": "21530542", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585498568357, "ground_truth": 0}, {"key": "38192532", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9441768564579549, "ground_truth": 0}, {"key": "38192532", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9304582610971421, "ground_truth": 0}, {"key": "38192532", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9161096132541251, "ground_truth": 0}, {"key": "38192532", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9284088008885222, "ground_truth": 0}, {"key": "38192532", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505370520287, "ground_truth": 0}, {"key": "34102400", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4551985816167797, "ground_truth": 0}, {"key": "34102400", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.4746311989845718, "ground_truth": 0}, {"key": "34102400", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5370413861053821, "ground_truth": 0}, {"key": "34102400", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.42059958925171287, "ground_truth": 0}, {"key": "34102400", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792179961158, "ground_truth": 0}, {"key": "36133399", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8459424323887942, "ground_truth": 0}, {"key": "36133399", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8577681002368184, "ground_truth": 0}, {"key": "36133399", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8539127465024542, "ground_truth": 0}, {"key": "36133399", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343813035393, "ground_truth": 0}, {"key": "36133399", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759875523706, "ground_truth": 0}, {"key": "34314544", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7122321827481123, "ground_truth": 0}, {"key": "34314544", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7826624956180663, "ground_truth": 0}, {"key": "34314544", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6943026820399255, "ground_truth": 0}, {"key": "34314544", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125795036464, "ground_truth": 0}, {"key": "34314544", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307438924268, "ground_truth": 0}, {"key": "33460074", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8714748734185518, "ground_truth": 0}, {"key": "33460074", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.828938811965313, "ground_truth": 0}, {"key": "33460074", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.815232510459497, "ground_truth": 0}, {"key": "33460074", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.737158174717316, "ground_truth": 0}, {"key": "33460074", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036294259752, "ground_truth": 0}, {"key": "36191495", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8615382079250469, "ground_truth": 0}, {"key": "36191495", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9059898176023983, "ground_truth": 0}, {"key": "36191495", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.782662486385108, "ground_truth": 0}, {"key": "36191495", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797627959285, "ground_truth": 0}, {"key": "36191495", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637540312606, "ground_truth": 0}, {"key": "39532668", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9304582543049001, "ground_truth": 0}, {"key": "39532668", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9039745178491462, "ground_truth": 0}, {"key": "39532668", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8469578405478361, "ground_truth": 0}, {"key": "39532668", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.828938815511231, "ground_truth": 0}, {"key": "39532668", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.844921534628073, "ground_truth": 0}, {"key": "20328247", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5078118707336665, "ground_truth": 0}, {"key": "20328247", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.4610167927088429, "ground_truth": 0}, {"key": "20328247", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5660185273161811, "ground_truth": 0}, {"key": "20328247", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878857761939, "ground_truth": 0}, {"key": "20328247", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982194156016, "ground_truth": 0}, {"key": "39112675", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.586996442401673, "ground_truth": 0}, {"key": "39112675", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.665410550591435, "ground_truth": 0}, {"key": "39112675", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7592254085212948, "ground_truth": 0}, {"key": "39112675", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740405268039, "ground_truth": 0}, {"key": "39112675", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118806430738, "ground_truth": 0}, {"key": "31620300", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7534666624157479, "ground_truth": 0}, {"key": "31620300", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7170118559376223, "ground_truth": 0}, {"key": "31620300", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7592253968875436, "ground_truth": 0}, {"key": "31620300", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680193179804, "ground_truth": 0}, {"key": "31620300", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666486587364, "ground_truth": 0}, {"key": "37518509", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7662936464240533, "ground_truth": 0}, {"key": "37518509", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.646013723138853, "ground_truth": 0}, {"key": "37518509", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6206216231367642, "ground_truth": 0}, {"key": "37518509", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102680892532, "ground_truth": 0}, {"key": "37518509", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224521701803, "ground_truth": 0}, {"key": "35454095", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7732163518875751, "ground_truth": 0}, {"key": "35454095", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9142907351273979, "ground_truth": 0}, {"key": "35454095", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8175744717081694, "ground_truth": 0}, {"key": "35454095", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300637077885, "ground_truth": 0}, {"key": "35454095", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575940772491, "ground_truth": 0}, {"key": "38542788", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9465966675288194, "ground_truth": 0}, {"key": "38542788", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9246876920535838, "ground_truth": 0}, {"key": "38542788", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9358173548347752, "ground_truth": 0}, {"key": "38542788", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067208694232, "ground_truth": 0}, {"key": "38542788", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9518632324172688, "ground_truth": 0}, {"key": "23944937", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6206216284226934, "ground_truth": 0}, {"key": "23944937", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5486735231315802, "ground_truth": 0}, {"key": "23944937", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5945512541025424, "ground_truth": 0}, {"key": "23944937", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.49804687590515984, "ground_truth": 0}, {"key": "23944937", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224335073362, "ground_truth": 0}, {"key": "31753944", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5964331422248718, "ground_truth": 0}, {"key": "31753944", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7074046975832713, "ground_truth": 0}, {"key": "31753944", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5409238633590223, "ground_truth": 0}, {"key": "31753944", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324556705063, "ground_truth": 0}, {"key": "31753944", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740028278758, "ground_truth": 0}, {"key": "35527214", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8289388137184102, "ground_truth": 0}, {"key": "35527214", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8300437704585295, "ground_truth": 0}, {"key": "35527214", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7662936373383142, "ground_truth": 0}, {"key": "35527214", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424356268985, "ground_truth": 0}, {"key": "35527214", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185899661267, "ground_truth": 0}, {"key": "40400404", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9635062340621704, "ground_truth": 0}, {"key": "40400404", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9504109780121959, "ground_truth": 0}, {"key": "40400404", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9651191112833177, "ground_truth": 0}, {"key": "40400404", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.946990225992519, "ground_truth": 0}, {"key": "40400404", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9686195675357024, "ground_truth": 0}, {"key": "21713119", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8791467771118754, "ground_truth": 0}, {"key": "21713119", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6992544251039892, "ground_truth": 0}, {"key": "21713119", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8947894597020813, "ground_truth": 0}, {"key": "21713119", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956580984125777, "ground_truth": 0}, {"key": "21713119", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.857768106787927, "ground_truth": 0}, {"key": "28730678", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7279754619456155, "ground_truth": 0}, {"key": "28730678", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8539127420739423, "ground_truth": 0}, {"key": "28730678", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8397339834715744, "ground_truth": 0}, {"key": "28730678", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163647539874, "ground_truth": 0}, {"key": "28730678", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085802310478, "ground_truth": 0}, {"key": "36823733", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8887587846535638, "ground_truth": 0}, {"key": "36823733", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7905303116671883, "ground_truth": 0}, {"key": "36823733", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.822189124165216, "ground_truth": 0}, {"key": "36823733", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835471501134, "ground_truth": 0}, {"key": "36823733", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505405512114, "ground_truth": 0}, {"key": "35988862", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6531269183247169, "ground_truth": 0}, {"key": "35988862", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7549150120457426, "ground_truth": 0}, {"key": "35988862", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7490872168135765, "ground_truth": 0}, {"key": "35988862", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163773948789, "ground_truth": 0}, {"key": "35988862", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762599011682, "ground_truth": 0}, {"key": "40499665", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9536217943901676, "ground_truth": 0}, {"key": "40499665", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9532750397040475, "ground_truth": 0}, {"key": "40499665", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9441768560166443, "ground_truth": 0}, {"key": "40499665", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9546474177520005, "ground_truth": 0}, {"key": "40499665", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9213576096883247, "ground_truth": 0}, {"key": "32829820", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8210441218805379, "ground_truth": 0}, {"key": "32829820", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5869964639966596, "ground_truth": 0}, {"key": "32829820", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6723317212358019, "ground_truth": 0}, {"key": "32829820", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432240323859, "ground_truth": 0}, {"key": "32829820", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740279303857, "ground_truth": 0}, {"key": "20583553", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.48242908238902965, "ground_truth": 0}, {"key": "20583553", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.35577488963099524, "ground_truth": 0}, {"key": "20583553", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6242935553269134, "ground_truth": 0}, {"key": "20583553", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734678449664, "ground_truth": 0}, {"key": "20583553", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.594551269501049, "ground_truth": 0}, {"key": "30501550", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9407897497347233, "ground_truth": 0}, {"key": "30501550", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9278878056090503, "ground_truth": 0}, {"key": "30501550", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9358173542859962, "ground_truth": 0}, {"key": "30501550", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9755769092772617, "ground_truth": 0}, {"key": "30501550", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9343951604136904, "ground_truth": 0}, {"key": "38755897", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.744656365119555, "ground_truth": 0}, {"key": "38755897", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.812867300688426, "ground_truth": 0}, {"key": "38755897", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8529354757564559, "ground_truth": 0}, {"key": "38755897", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527690406042, "ground_truth": 0}, {"key": "38755897", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677563352017, "ground_truth": 0}, {"key": "35507201", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8418256455443365, "ground_truth": 0}, {"key": "35507201", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8749346160436156, "ground_truth": 0}, {"key": "35507201", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7416740114814081, "ground_truth": 0}, {"key": "35507201", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419907467372, "ground_truth": 0}, {"key": "35507201", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.836554533815577, "ground_truth": 0}, {"key": "36453511", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8624675471686338, "ground_truth": 0}, {"key": "36453511", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8311430398183145, "ground_truth": 0}, {"key": "36453511", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8519528139623223, "ground_truth": 0}, {"key": "36453511", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9105453982477971, "ground_truth": 0}, {"key": "36453511", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.902609602077698, "ground_truth": 0}, {"key": "38066835", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9039745154641059, "ground_truth": 0}, {"key": "38066835", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9167080740027331, "ground_truth": 0}, {"key": "38066835", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148300473337, "ground_truth": 0}, {"key": "38066835", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.91243615432771, "ground_truth": 0}, {"key": "38066835", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9207896794961112, "ground_truth": 0}, {"key": "39697181", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6442251081923619, "ground_truth": 0}, {"key": "39697181", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7025300660026278, "ground_truth": 0}, {"key": "39697181", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7826624907850613, "ground_truth": 0}, {"key": "39697181", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105729718893, "ground_truth": 0}, {"key": "39697181", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004166179882, "ground_truth": 0}, {"key": "21820893", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7476159701536236, "ground_truth": 0}, {"key": "21820893", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7634837624430202, "ground_truth": 0}, {"key": "21820893", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.827828159785948, "ground_truth": 0}, {"key": "21820893", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437649914599, "ground_truth": 0}, {"key": "21820893", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867945696324, "ground_truth": 0}, {"key": "40519933", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.879146768968897, "ground_truth": 0}, {"key": "40519933", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7905303265948974, "ground_truth": 0}, {"key": "40519933", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.861538208219452, "ground_truth": 0}, {"key": "40519933", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277804591482, "ground_truth": 0}, {"key": "40519933", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797721936646, "ground_truth": 0}, {"key": "30446033", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.85585114208403, "ground_truth": 0}, {"key": "30446033", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.833324605165918, "ground_truth": 0}, {"key": "30446033", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9136765257611051, "ground_truth": 0}, {"key": "30446033", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357548428459, "ground_truth": 0}, {"key": "30446033", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681169831352, "ground_truth": 0}, {"key": "40216291", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8322366617117302, "ground_truth": 0}, {"key": "40216291", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8697145858938317, "ground_truth": 0}, {"key": "40216291", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9136765221403995, "ground_truth": 0}, {"key": "40216291", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338455511413, "ground_truth": 0}, {"key": "40216291", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942266250979, "ground_truth": 0}, {"key": "33479118", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6893056114175875, "ground_truth": 0}, {"key": "33479118", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6370307767439235, "ground_truth": 0}, {"key": "33479118", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7620700946933099, "ground_truth": 0}, {"key": "33479118", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324918147025, "ground_truth": 0}, {"key": "33479118", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442251030872456, "ground_truth": 0}, {"key": "22297373", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7892337057643237, "ground_truth": 0}, {"key": "22297373", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431680187360977, "ground_truth": 0}, {"key": "22297373", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7170118938456739, "ground_truth": 0}, {"key": "22297373", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.738669075530869, "ground_truth": 0}, {"key": "22297373", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224191212428, "ground_truth": 0}, {"key": "36463668", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7041601369272024, "ground_truth": 0}, {"key": "36463668", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619366122974, "ground_truth": 0}, {"key": "36463668", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7759445446001333, "ground_truth": 0}, {"key": "36463668", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033636112249, "ground_truth": 0}, {"key": "36463668", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526268262177, "ground_truth": 0}, {"key": "35264615", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6842640439721059, "ground_truth": 0}, {"key": "35264615", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8080672175117414, "ground_truth": 0}, {"key": "35264615", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6424324724835202, "ground_truth": 0}, {"key": "35264615", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.753466647305359, "ground_truth": 0}, {"key": "35264615", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837548832316, "ground_truth": 0}, {"key": "39898482", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8652240874370073, "ground_truth": 0}, {"key": "39898482", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9582261154346826, "ground_truth": 0}, {"key": "39898482", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9339146112321192, "ground_truth": 0}, {"key": "39898482", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823409591304, "ground_truth": 0}, {"key": "39898482", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.944176860418225, "ground_truth": 0}, {"key": "37228721", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8652240749909293, "ground_truth": 0}, {"key": "37228721", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8587185860177343, "ground_truth": 0}, {"key": "37228721", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8469578614527388, "ground_truth": 0}, {"key": "37228721", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437610727376, "ground_truth": 0}, {"key": "37228721", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.889528863746342, "ground_truth": 0}, {"key": "24535799", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9821512621146764, "ground_truth": 0}, {"key": "24535799", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9815951087597544, "ground_truth": 0}, {"key": "24535799", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9736446508012008, "ground_truth": 0}, {"key": "24535799", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9597620560399859, "ground_truth": 0}, {"key": "24535799", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9559813469243079, "ground_truth": 0}, {"key": "35177759", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8244619370534382, "ground_truth": 0}, {"key": "35177759", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7943849513550878, "ground_truth": 0}, {"key": "35177759", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8221891270342879, "ground_truth": 0}, {"key": "35177759", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8955226679935732, "ground_truth": 0}, {"key": "35177759", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037286637456, "ground_truth": 0}, {"key": "34364829", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7606506515238916, "ground_truth": 0}, {"key": "34364829", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.732591847082617, "ground_truth": 0}, {"key": "34364829", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8056322014395625, "ground_truth": 0}, {"key": "34364829", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936411332247, "ground_truth": 0}, {"key": "34364829", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163759810337, "ground_truth": 0}, {"key": "38090732", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8333245912933022, "ground_truth": 0}, {"key": "38090732", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7759445263671018, "ground_truth": 0}, {"key": "38090732", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8643104579015445, "ground_truth": 0}, {"key": "38090732", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513726526131, "ground_truth": 0}, {"key": "38090732", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070037053717, "ground_truth": 0}, {"key": "30651479", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7690802558041011, "ground_truth": 0}, {"key": "30651479", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9124361645888536, "ground_truth": 0}, {"key": "30651479", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8365545675633093, "ground_truth": 0}, {"key": "30651479", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920058835845, "ground_truth": 0}, {"key": "30651479", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883611808545, "ground_truth": 0}, {"key": "39380921", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7690802509302956, "ground_truth": 0}, {"key": "39380921", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7461389853115803, "ground_truth": 0}, {"key": "39380921", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7490872183504937, "ground_truth": 0}, {"key": "39380921", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253651136642, "ground_truth": 0}, {"key": "39380921", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581539014415, "ground_truth": 0}, {"key": "39037490", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.42441199962429443, "ground_truth": 0}, {"key": "39037490", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.46684559101950485, "ground_truth": 0}, {"key": "39037490", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.4921881389398418, "ground_truth": 0}, {"key": "39037490", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352860229709, "ground_truth": 0}, {"key": "39037490", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269185869881, "ground_truth": 0}, {"key": "35917499", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.808067217207421, "ground_truth": 0}, {"key": "35917499", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8732148197763925, "ground_truth": 0}, {"key": "35917499", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9079671336523581, "ground_truth": 0}, {"key": "35917499", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942275980588, "ground_truth": 0}, {"key": "35917499", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9213576127777443, "ground_truth": 0}, {"key": "34908073", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7853085684532845, "ground_truth": 0}, {"key": "34908073", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8376199668928974, "ground_truth": 0}, {"key": "34908073", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7879311965281731, "ground_truth": 0}, {"key": "34908073", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089366077446, "ground_truth": 0}, {"key": "34908073", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759708641453, "ground_truth": 0}, {"key": "36344759", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9385759602804897, "ground_truth": 0}, {"key": "36344759", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.854884645650029, "ground_truth": 0}, {"key": "36344759", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8661325066333394, "ground_truth": 0}, {"key": "36344759", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9149009603192991, "ground_truth": 0}, {"key": "36344759", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.865224085497663, "ground_truth": 0}, {"key": "39984637", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7325918340130793, "ground_truth": 0}, {"key": "39984637", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7969253746106106, "ground_truth": 0}, {"key": "39984637", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5832033233574031, "ground_truth": 0}, {"key": "39984637", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185287878347, "ground_truth": 0}, {"key": "39984637", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224408018724, "ground_truth": 0}, {"key": "17917326", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.854884632905468, "ground_truth": 0}, {"key": "17917326", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.741674023164158, "ground_truth": 0}, {"key": "17917326", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9118099539060531, "ground_truth": 0}, {"key": "17917326", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898485338186, "ground_truth": 0}, {"key": "17917326", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601332419446, "ground_truth": 0}, {"key": "32193638", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8019358242778947, "ground_truth": 0}, {"key": "32193638", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8774767959027407, "ground_truth": 0}, {"key": "32193638", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7310585711828367, "ground_truth": 0}, {"key": "32193638", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690978711672, "ground_truth": 0}, {"key": "32193638", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435027413036, "ground_truth": 0}, {"key": "34564692", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8080672142990432, "ground_truth": 0}, {"key": "34564692", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7310585748072997, "ground_truth": 0}, {"key": "34564692", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8397339765354208, "ground_truth": 0}, {"key": "34564692", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437732312876, "ground_truth": 0}, {"key": "34564692", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125825141103, "ground_truth": 0}, {"key": "39329284", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9864678509963739, "ground_truth": 0}, {"key": "39329284", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.957277801045126, "ground_truth": 0}, {"key": "39329284", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9761291640756252, "ground_truth": 0}, {"key": "39329284", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9750122060998908, "ground_truth": 0}, {"key": "39329284", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9939964045809722, "ground_truth": 0}, {"key": "37438541", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6976089153514522, "ground_truth": 0}, {"key": "37438541", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6909763116144291, "ground_truth": 0}, {"key": "37438541", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6548947337746781, "ground_truth": 0}, {"key": "37438541", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.644225110506426, "ground_truth": 0}, {"key": "37438541", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983122074660783, "ground_truth": 0}, {"key": "34652757", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9224823427562532, "ground_truth": 0}, {"key": "34652757", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.895522682819783, "ground_truth": 0}, {"key": "34652757", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9019206768295622, "ground_truth": 0}, {"key": "34652757", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9053223073856235, "ground_truth": 0}, {"key": "34652757", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.891054958224342, "ground_truth": 0}, {"key": "31361004", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7201715117845834, "ground_truth": 0}, {"key": "31361004", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7648916151904394, "ground_truth": 0}, {"key": "31361004", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9362850079160441, "ground_truth": 0}, {"key": "31361004", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314637427193, "ground_truth": 0}, {"key": "31361004", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357431518199, "ground_truth": 0}, {"key": "26150727", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6513548440315201, "ground_truth": 0}, {"key": "26150727", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6688802820407973, "ground_truth": 0}, {"key": "26150727", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5717666113093821, "ground_truth": 0}, {"key": "26150727", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948268598463, "ground_truth": 0}, {"key": "26150727", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102557167447, "ground_truth": 0}, {"key": "36997402", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8278281639900177, "ground_truth": 0}, {"key": "36997402", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9005297914870667, "ground_truth": 0}, {"key": "36997402", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9032942102473482, "ground_truth": 0}, {"key": "36997402", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583425140353, "ground_truth": 0}, {"key": "36997402", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339575650148, "ground_truth": 0}, {"key": "37430643", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6224593320020739, "ground_truth": 0}, {"key": "37430643", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7122321899540467, "ground_truth": 0}, {"key": "37430643", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7170118813945727, "ground_truth": 0}, {"key": "37430643", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504787642064, "ground_truth": 0}, {"key": "37430643", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358286953321, "ground_truth": 0}, {"key": "36964631", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8539127672543243, "ground_truth": 0}, {"key": "36964631", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8791467730777949, "ground_truth": 0}, {"key": "36964631", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8962513646336078, "ground_truth": 0}, {"key": "36964631", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9319595790787171, "ground_truth": 0}, {"key": "36964631", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894604096839, "ground_truth": 0}, {"key": "35502013", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7634837572818268, "ground_truth": 0}, {"key": "35502013", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7185943916715475, "ground_truth": 0}, {"key": "35502013", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6206216402519256, "ground_truth": 0}, {"key": "35502013", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281430982297, "ground_truth": 0}, {"key": "35502013", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920005842613, "ground_truth": 0}, {"key": "33987664", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.860603627817375, "ground_truth": 0}, {"key": "33987664", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9105453980202041, "ground_truth": 0}, {"key": "33987664", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.897695283901928, "ground_truth": 0}, {"key": "33987664", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145692626206, "ground_truth": 0}, {"key": "33987664", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942307053017, "ground_truth": 0}, {"key": "35203721", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6926419603219688, "ground_truth": 0}, {"key": "35203721", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7008947974354575, "ground_truth": 0}, {"key": "35203721", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7008947910920177, "ground_truth": 0}, {"key": "35203721", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136905364878, "ground_truth": 0}, {"key": "35203721", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105848802834, "ground_truth": 0}, {"key": "39028348", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7431680135112395, "ground_truth": 0}, {"key": "39028348", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7217432181719443, "ground_truth": 0}, {"key": "39028348", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8164063922922835, "ground_truth": 0}, {"key": "39028348", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681055118659, "ground_truth": 0}, {"key": "39028348", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.774583375345353, "ground_truth": 0}, {"key": "37459383", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8732148309983, "ground_truth": 0}, {"key": "37459383", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8044059250010576, "ground_truth": 0}, {"key": "37459383", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8519528129597155, "ground_truth": 0}, {"key": "37459383", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894609404186, "ground_truth": 0}, {"key": "37459383", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711911533376, "ground_truth": 0}, {"key": "34020070", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8104789113670402, "ground_truth": 0}, {"key": "34020070", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.826711788905853, "ground_truth": 0}, {"key": "34020070", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9039745204993458, "ground_truth": 0}, {"key": "34020070", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267797723123, "ground_truth": 0}, {"key": "34020070", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117866490759, "ground_truth": 0}, {"key": "35176615", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8832359938621984, "ground_truth": 0}, {"key": "35176615", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9019206736984542, "ground_truth": 0}, {"key": "35176615", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.917302659407487, "ground_truth": 0}, {"key": "35176615", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127611437148, "ground_truth": 0}, {"key": "35176615", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.906653120751368, "ground_truth": 0}, {"key": "33296389", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7325918422739531, "ground_truth": 0}, {"key": "33296389", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6442251356662719, "ground_truth": 0}, {"key": "33296389", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8509647010699705, "ground_truth": 0}, {"key": "33296389", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059461698698, "ground_truth": 0}, {"key": "33296389", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680190353402, "ground_truth": 0}, {"key": "35399504", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8766343793878119, "ground_truth": 0}, {"key": "35399504", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9099070026019443, "ground_truth": 0}, {"key": "35399504", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8864204091507313, "ground_truth": 0}, {"key": "35399504", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.916708084694152, "ground_truth": 0}, {"key": "35399504", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274100037206, "ground_truth": 0}, {"key": "34807886", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7446563310615797, "ground_truth": 0}, {"key": "34807886", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6224593329515982, "ground_truth": 0}, {"key": "34807886", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8832359893667869, "ground_truth": 0}, {"key": "34807886", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059281451892, "ground_truth": 0}, {"key": "34807886", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593321815836, "ground_truth": 0}, {"key": "37629813", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7090191231368674, "ground_truth": 0}, {"key": "37629813", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.787931201671393, "ground_truth": 0}, {"key": "37629813", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7279754331781966, "ground_truth": 0}, {"key": "37629813", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549548493794, "ground_truth": 0}, {"key": "37629813", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935338872648, "ground_truth": 0}, {"key": "28084389", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7676898593719046, "ground_truth": 0}, {"key": "28084389", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7994423141434905, "ground_truth": 0}, {"key": "28084389", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8267117945087996, "ground_truth": 0}, {"key": "28084389", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437655739056, "ground_truth": 0}, {"key": "28084389", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283915866423, "ground_truth": 0}, {"key": "35391734", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9118099569888688, "ground_truth": 0}, {"key": "35391734", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9324533056300388, "ground_truth": 0}, {"key": "35391734", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9124361527612508, "ground_truth": 0}, {"key": "35391734", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9268352820261896, "ground_truth": 0}, {"key": "35391734", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9403530605165603, "ground_truth": 0}, {"key": "40214591", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8615382025365808, "ground_truth": 0}, {"key": "40214591", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.870597263973277, "ground_truth": 0}, {"key": "40214591", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7490872122307227, "ground_truth": 0}, {"key": "40214591", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.887984044197615, "ground_truth": 0}, {"key": "40214591", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145685570725, "ground_truth": 0}, {"key": "26283171", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.874077235090702, "ground_truth": 0}, {"key": "26283171", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9425067226524859, "ground_truth": 0}, {"key": "26283171", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8872045976633515, "ground_truth": 0}, {"key": "26283171", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204062865833, "ground_truth": 0}, {"key": "26283171", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846266232243, "ground_truth": 0}, {"key": "37084030", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4765796382441689, "ground_truth": 0}, {"key": "37084030", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5273165210629409, "ground_truth": 0}, {"key": "37084030", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5983122133920975, "ground_truth": 0}, {"key": "37084030", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366079137245, "ground_truth": 0}, {"key": "37084030", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717665962874383, "ground_truth": 0}, {"key": "39027295", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.46490157734002957, "ground_truth": 0}, {"key": "39027295", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6132365508803601, "ground_truth": 0}, {"key": "39027295", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6566582673070818, "ground_truth": 0}, {"key": "39027295", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154240148716324, "ground_truth": 0}, {"key": "39027295", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734839416854, "ground_truth": 0}, {"key": "14018647", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7057850108995513, "ground_truth": 0}, {"key": "14018647", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6297746346752682, "ground_truth": 0}, {"key": "14018647", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6352224322346675, "ground_truth": 0}, {"key": "14018647", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224146050254, "ground_truth": 0}, {"key": "14018647", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632843565653, "ground_truth": 0}, {"key": "37424289", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.962391360854774, "ground_truth": 0}, {"key": "37424289", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.972414717373263, "ground_truth": 0}, {"key": "37424289", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9681411444933729, "ground_truth": 0}, {"key": "37424289", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9572778022112659, "ground_truth": 0}, {"key": "37424289", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9629528349460286, "ground_truth": 0}, {"key": "37498031", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8670357624882845, "ground_truth": 0}, {"key": "37498031", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8872046047076612, "ground_truth": 0}, {"key": "37498031", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8840392929240984, "ground_truth": 0}, {"key": "37498031", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9420819126217655, "ground_truth": 0}, {"key": "37498031", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9319595795994292, "ground_truth": 0}, {"key": "30104095", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9136765236995659, "ground_truth": 0}, {"key": "30104095", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9086179052017453, "ground_truth": 0}, {"key": "30104095", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8652240784972012, "ground_truth": 0}, {"key": "30104095", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142457504491, "ground_truth": 0}, {"key": "30104095", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9299510359029943, "ground_truth": 0}, {"key": "37911407", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9079671422919326, "ground_truth": 0}, {"key": "37911407", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9481545347530821, "ground_truth": 0}, {"key": "37911407", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9465966647236023, "ground_truth": 0}, {"key": "37911407", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9399133479523123, "ground_truth": 0}, {"key": "37911407", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.95362179452373, "ground_truth": 0}, {"key": "39177472", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9066531265054312, "ground_truth": 0}, {"key": "39177472", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.887204603319332, "ground_truth": 0}, {"key": "39177472", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7371581552841597, "ground_truth": 0}, {"key": "39177472", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.856812298168713, "ground_truth": 0}, {"key": "39177472", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148266427137, "ground_truth": 0}, {"key": "32325454", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9173026593688244, "ground_truth": 0}, {"key": "32325454", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.876634373266818, "ground_truth": 0}, {"key": "32325454", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8365545706150931, "ground_truth": 0}, {"key": "32325454", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314710647131, "ground_truth": 0}, {"key": "32325454", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467659063098, "ground_truth": 0}, {"key": "38395319", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7534666699995678, "ground_truth": 0}, {"key": "38395319", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.700894819089613, "ground_truth": 0}, {"key": "38395319", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7839884701338378, "ground_truth": 0}, {"key": "38395319", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804325807669, "ground_truth": 0}, {"key": "38395319", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442250831588858, "ground_truth": 0}, {"key": "38235895", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6943026872569793, "ground_truth": 0}, {"key": "38235895", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6706082862721092, "ground_truth": 0}, {"key": "38235895", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8895288511567964, "ground_truth": 0}, {"key": "38235895", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154240072085594, "ground_truth": 0}, {"key": "38235895", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673034628983, "ground_truth": 0}, {"key": "26543267", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7279754421272713, "ground_truth": 0}, {"key": "26543267", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8548846367382981, "ground_truth": 0}, {"key": "26543267", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7401743552063438, "ground_truth": 0}, {"key": "26543267", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085869895352, "ground_truth": 0}, {"key": "26543267", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802474940291, "ground_truth": 0}, {"key": "39054728", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9594592624741612, "ground_truth": 0}, {"key": "39054728", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9726235115883127, "ground_truth": 0}, {"key": "39054728", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9572778050977745, "ground_truth": 0}, {"key": "39054728", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.952925820360116, "ground_truth": 0}, {"key": "39054728", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9640516771458474, "ground_truth": 0}, {"key": "39158443", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9190632907652521, "ground_truth": 0}, {"key": "39158443", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8799743679773687, "ground_truth": 0}, {"key": "39158443", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8947894652278919, "ground_truth": 0}, {"key": "39158443", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743711247657, "ground_truth": 0}, {"key": "39158443", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.858718582383796, "ground_truth": 0}, {"key": "36254201", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6169358479962381, "ground_truth": 0}, {"key": "36254201", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5350984198227718, "ground_truth": 0}, {"key": "36254201", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7356416390021776, "ground_truth": 0}, {"key": "36254201", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690637358129, "ground_truth": 0}, {"key": "36254201", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324915275417, "ground_truth": 0}, {"key": "23434347", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7606506615898646, "ground_truth": 0}, {"key": "23434347", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5813030948766017, "ground_truth": 0}, {"key": "23434347", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7476159648573566, "ground_truth": 0}, {"key": "23434347", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256478362098, "ground_truth": 0}, {"key": "23434347", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789129763288, "ground_truth": 0}, {"key": "34397620", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6334102818010229, "ground_truth": 0}, {"key": "34397620", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6224593152620055, "ground_truth": 0}, {"key": "34397620", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5602526576324611, "ground_truth": 0}, {"key": "34397620", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948059729506, "ground_truth": 0}, {"key": "34397620", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702541250125, "ground_truth": 0}, {"key": "34340916", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8407825908789122, "ground_truth": 0}, {"key": "34340916", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8056321813897519, "ground_truth": 0}, {"key": "34340916", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6636689528617709, "ground_truth": 0}, {"key": "34340916", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240868418997, "ground_truth": 0}, {"key": "34340916", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884632312606, "ground_truth": 0}, {"key": "30375089", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8670357487858693, "ground_truth": 0}, {"key": "30375089", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7185943918452019, "ground_truth": 0}, {"key": "30375089", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8438951142564396, "ground_truth": 0}, {"key": "30375089", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509647109316364, "ground_truth": 0}, {"key": "30375089", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527934783115, "ground_truth": 0}, {"key": "35807797", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9213576266574484, "ground_truth": 0}, {"key": "35807797", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8749346148215384, "ground_truth": 0}, {"key": "35807797", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.938124014670715, "ground_truth": 0}, {"key": "35807797", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.892562523420156, "ground_truth": 0}, {"key": "35807797", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9246876913724168, "ground_truth": 0}, {"key": "34188172", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8056321822225615, "ground_truth": 0}, {"key": "34188172", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6150878557955232, "ground_truth": 0}, {"key": "34188172", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7074047008514834, "ground_truth": 0}, {"key": "34188172", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672121483128, "ground_truth": 0}, {"key": "34188172", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746236377273, "ground_truth": 0}, {"key": "37075567", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9407897482103744, "ground_truth": 0}, {"key": "37075567", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8783142484122837, "ground_truth": 0}, {"key": "37075567", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9309620807414993, "ground_truth": 0}, {"key": "37075567", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213789075785, "ground_truth": 0}, {"key": "37075567", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9500414794244357, "ground_truth": 0}, {"key": "35559735", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7356416224564575, "ground_truth": 0}, {"key": "35559735", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526149894972, "ground_truth": 0}, {"key": "35559735", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8596637460223868, "ground_truth": 0}, {"key": "35559735", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849720128635, "ground_truth": 0}, {"key": "35559735", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943721172332, "ground_truth": 0}, {"key": "33005019", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6636689450761024, "ground_truth": 0}, {"key": "33005019", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6706082832299285, "ground_truth": 0}, {"key": "33005019", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.809275979335339, "ground_truth": 0}, {"key": "33005019", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891210682247, "ground_truth": 0}, {"key": "33005019", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916035983034, "ground_truth": 0}, {"key": "30808252", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7325918516290285, "ground_truth": 0}, {"key": "30808252", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431680053741466, "ground_truth": 0}, {"key": "30808252", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7577943759337789, "ground_truth": 0}, {"key": "30808252", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919952998919, "ground_truth": 0}, {"key": "30808252", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300553879545, "ground_truth": 0}, {"key": "15159017", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6477982059457562, "ground_truth": 0}, {"key": "15159017", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8596637500403214, "ground_truth": 0}, {"key": "15159017", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.861538201777889, "ground_truth": 0}, {"key": "15159017", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.774583378868913, "ground_truth": 0}, {"key": "15159017", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.731058594431531, "ground_truth": 0}, {"key": "24493400", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7620701099476894, "ground_truth": 0}, {"key": "24493400", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8080672035108187, "ground_truth": 0}, {"key": "24493400", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.895522683519964, "ground_truth": 0}, {"key": "24493400", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163719454099, "ground_truth": 0}, {"key": "24493400", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869935300513, "ground_truth": 0}, {"key": "37791071", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8969755649638101, "ground_truth": 0}, {"key": "37791071", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9086179019929802, "ground_truth": 0}, {"key": "37791071", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9263037226818263, "ground_truth": 0}, {"key": "37791071", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583508186794, "ground_truth": 0}, {"key": "37791071", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9124361527247083, "ground_truth": 0}, {"key": "33528627", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8679338349717846, "ground_truth": 0}, {"key": "33528627", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7648916187321564, "ground_truth": 0}, {"key": "33528627", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7866228448657209, "ground_truth": 0}, {"key": "33528627", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438951085517075, "ground_truth": 0}, {"key": "33528627", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441191574427, "ground_truth": 0}, {"key": "39925662", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8824278697001505, "ground_truth": 0}, {"key": "39925662", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9500414702001702, "ground_truth": 0}, {"key": "39925662", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9207896763709873, "ground_truth": 0}, {"key": "39925662", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204186785043, "ground_truth": 0}, {"key": "39925662", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972904899625, "ground_truth": 0}, {"key": "29213416", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6132365507789165, "ground_truth": 0}, {"key": "29213416", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7563575585213462, "ground_truth": 0}, {"key": "29213416", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7233094668103953, "ground_truth": 0}, {"key": "29213416", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316867538536, "ground_truth": 0}, {"key": "29213416", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837529822079, "ground_truth": 0}, {"key": "34492745", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5679365993665996, "ground_truth": 0}, {"key": "34492745", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6460136696849785, "ground_truth": 0}, {"key": "34492745", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5964331784483503, "ground_truth": 0}, {"key": "34492745", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191144863867, "ground_truth": 0}, {"key": "34492745", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.672331694816314, "ground_truth": 0}, {"key": "34191937", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7549149915005775, "ground_truth": 0}, {"key": "34191937", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6020615901524176, "ground_truth": 0}, {"key": "34191937", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.840782603683971, "ground_truth": 0}, {"key": "34191937", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.721743184052506, "ground_truth": 0}, {"key": "34191937", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983122173369174, "ground_truth": 0}, {"key": "34933372", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.901920687512072, "ground_truth": 0}, {"key": "34933372", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8783142450323677, "ground_truth": 0}, {"key": "34933372", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9196425326424925, "ground_truth": 0}, {"key": "34933372", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.889528844221763, "ground_truth": 0}, {"key": "34933372", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206761834201, "ground_truth": 0}, {"key": "38714379", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9722043799678449, "ground_truth": 0}, {"key": "38714379", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9525741332618709, "ground_truth": 0}, {"key": "38714379", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9618217287478044, "ground_truth": 0}, {"key": "38714379", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9661559649797223, "ground_truth": 0}, {"key": "38714379", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9563089434407007, "ground_truth": 0}, {"key": "39220660", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8624675348498344, "ground_truth": 0}, {"key": "39220660", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9469902329042156, "ground_truth": 0}, {"key": "39220660", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.91117971184871, "ground_truth": 0}, {"key": "39220660", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9149009502914468, "ground_truth": 0}, {"key": "39220660", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467672973389, "ground_truth": 0}, {"key": "41028780", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8670357648097603, "ground_truth": 0}, {"key": "41028780", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.835483530204431, "ground_truth": 0}, {"key": "41028780", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.865224081831523, "ground_truth": 0}, {"key": "41028780", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585865229045, "ground_truth": 0}, {"key": "41028780", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690890997324, "ground_truth": 0}, {"key": "39457108", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7074046934156877, "ground_truth": 0}, {"key": "39457108", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5525397336466672, "ground_truth": 0}, {"key": "39457108", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7718434828849768, "ground_truth": 0}, {"key": "39457108", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690694336998, "ground_truth": 0}, {"key": "39457108", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666442892429, "ground_truth": 0}, {"key": "38288018", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7106283079912622, "ground_truth": 0}, {"key": "38288018", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6039318329813043, "ground_truth": 0}, {"key": "38288018", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6688802622736371, "ground_truth": 0}, {"key": "38288018", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125607198, "ground_truth": 0}, {"key": "38288018", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046914930043, "ground_truth": 0}, {"key": "40106293", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5273165274015853, "ground_truth": 0}, {"key": "40106293", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6424324590703246, "ground_truth": 0}, {"key": "40106293", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.4726834653584796, "ground_truth": 0}, {"key": "40106293", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544167622309, "ground_truth": 0}, {"key": "40106293", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.36840568847057814, "ground_truth": 0}, {"key": "39948797", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.827828167501132, "ground_truth": 0}, {"key": "39948797", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8577681064538439, "ground_truth": 0}, {"key": "39948797", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8652240717651265, "ground_truth": 0}, {"key": "39948797", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943518709873, "ground_truth": 0}, {"key": "39948797", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.863391620831955, "ground_truth": 0}, {"key": "31853399", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8998277764061761, "ground_truth": 0}, {"key": "31853399", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8624675369700565, "ground_truth": 0}, {"key": "31853399", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.884837769455041, "ground_truth": 0}, {"key": "31853399", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9059898241263844, "ground_truth": 0}, {"key": "31853399", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919738948266, "ground_truth": 0}, {"key": "35273252", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7446563496265277, "ground_truth": 0}, {"key": "35273252", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6757646205214651, "ground_truth": 0}, {"key": "35273252", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7371581754294646, "ground_truth": 0}, {"key": "35273252", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352796281047, "ground_truth": 0}, {"key": "35273252", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442251135652041, "ground_truth": 0}, {"key": "37130459", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.970239905379021, "ground_truth": 0}, {"key": "37130459", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9798226797098437, "ground_truth": 0}, {"key": "37130459", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.948154537555082, "ground_truth": 0}, {"key": "37130459", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9626731132049355, "ground_truth": 0}, {"key": "37130459", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9790357583826547, "ground_truth": 0}, {"key": "21734003", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8856314701727616, "ground_truth": 0}, {"key": "21734003", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9005297909061294, "ground_truth": 0}, {"key": "21734003", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8469578299377197, "ground_truth": 0}, {"key": "21734003", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797082713563, "ground_truth": 0}, {"key": "21734003", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916059990046, "ground_truth": 0}, {"key": "33990737", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7416740180474185, "ground_truth": 0}, {"key": "33990737", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7648916111415149, "ground_truth": 0}, {"key": "33990737", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.764891589939887, "ground_truth": 0}, {"key": "33990737", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297745968850855, "ground_truth": 0}, {"key": "33990737", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527744060373, "ground_truth": 0}, {"key": "34559912", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8624675160735703, "ground_truth": 0}, {"key": "34559912", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9059898284573276, "ground_truth": 0}, {"key": "34559912", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8449215315430751, "ground_truth": 0}, {"key": "34559912", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.872347377252885, "ground_truth": 0}, {"key": "34559912", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846417332545, "ground_truth": 0}, {"key": "39820439", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.3775406793961713, "ground_truth": 0}, {"key": "39820439", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5640984590439962, "ground_truth": 0}, {"key": "39820439", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5602526751001468, "ground_truth": 0}, {"key": "39820439", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.36116471878284506, "ground_truth": 0}, {"key": "39820439", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132650697538873, "ground_truth": 0}, {"key": "34759328", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8509647202224777, "ground_truth": 0}, {"key": "34759328", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9230391712733705, "ground_truth": 0}, {"key": "34759328", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8933093927038229, "ground_truth": 0}, {"key": "34759328", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361497844935, "ground_truth": 0}, {"key": "34759328", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972776855609, "ground_truth": 0}, {"key": "36939137", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7431680006749253, "ground_truth": 0}, {"key": "36939137", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8824278601855212, "ground_truth": 0}, {"key": "36939137", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7799929065235635, "ground_truth": 0}, {"key": "36939137", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578460564108, "ground_truth": 0}, {"key": "36939137", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916018976967, "ground_truth": 0}, {"key": "35851522", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8140528248712092, "ground_truth": 0}, {"key": "35851522", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8278281639776638, "ground_truth": 0}, {"key": "35851522", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7371581709851301, "ground_truth": 0}, {"key": "35851522", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601331577924, "ground_truth": 0}, {"key": "35851522", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637474957527, "ground_truth": 0}, {"key": "22412782", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6808786259907905, "ground_truth": 0}, {"key": "22412782", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7956581082150793, "ground_truth": 0}, {"key": "22412782", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7356416446802794, "ground_truth": 0}, {"key": "22412782", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.724870257544022, "ground_truth": 0}, {"key": "22412782", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256011631416, "ground_truth": 0}, {"key": "38579227", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9136765230908167, "ground_truth": 0}, {"key": "38579227", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9381240107562528, "ground_truth": 0}, {"key": "38579227", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9219218364808663, "ground_truth": 0}, {"key": "38579227", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.934872452410619, "ground_truth": 0}, {"key": "38579227", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9489172610291076, "ground_truth": 0}, {"key": "37206995", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9099070050539315, "ground_truth": 0}, {"key": "37206995", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9019206739942088, "ground_truth": 0}, {"key": "37206995", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9161096115921421, "ground_truth": 0}, {"key": "37206995", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361581770846, "ground_truth": 0}, {"key": "37206995", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872045894181579, "ground_truth": 0}, {"key": "38700847", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9353465080810568, "ground_truth": 0}, {"key": "38700847", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9437636546775438, "ground_truth": 0}, {"key": "38700847", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9546474198220238, "ground_truth": 0}, {"key": "38700847", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9582261177172612, "ground_truth": 0}, {"key": "38700847", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9485372367619144, "ground_truth": 0}, {"key": "20246590", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9892648366831069, "ground_truth": 0}, {"key": "20246590", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9958980707477568, "ground_truth": 0}, {"key": "20246590", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.994739147566929, "ground_truth": 0}, {"key": "20246590", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9875683494039981, "ground_truth": 0}, {"key": "20246590", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9793540670707211, "ground_truth": 0}, {"key": "39141360", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7041601238979989, "ground_truth": 0}, {"key": "39141360", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6791787053585421, "ground_truth": 0}, {"key": "39141360", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.794384963791868, "ground_truth": 0}, {"key": "39141360", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933400819338, "ground_truth": 0}, {"key": "39141360", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736783945231031, "ground_truth": 0}, {"key": "37906226", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5428632332446225, "ground_truth": 0}, {"key": "37906226", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5312093676079882, "ground_truth": 0}, {"key": "37906226", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5525396982657825, "ground_truth": 0}, {"key": "37906226", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.661922881599554, "ground_truth": 0}, {"key": "37906226", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165036156763, "ground_truth": 0}, {"key": "16201033", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7341195121727045, "ground_truth": 0}, {"key": "16201033", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8311430454213432, "ground_truth": 0}, {"key": "16201033", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6774740160400268, "ground_truth": 0}, {"key": "16201033", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.704160136420709, "ground_truth": 0}, {"key": "16201033", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548719893333, "ground_truth": 0}, {"key": "36469022", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7592253881878478, "ground_truth": 0}, {"key": "36469022", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7025300504022854, "ground_truth": 0}, {"key": "36469022", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7386690867144807, "ground_truth": 0}, {"key": "36469022", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943624781459, "ground_truth": 0}, {"key": "36469022", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804461516859, "ground_truth": 0}, {"key": "31295270", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.667147670931592, "ground_truth": 0}, {"key": "31295270", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8255897244598781, "ground_truth": 0}, {"key": "31295270", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6513548544608735, "ground_truth": 0}, {"key": "31295270", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575494852304, "ground_truth": 0}, {"key": "31295270", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056458765026, "ground_truth": 0}, {"key": "35360689", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5813030965303767, "ground_truth": 0}, {"key": "35360689", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.40356686439170203, "ground_truth": 0}, {"key": "35360689", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.4668456181150181, "ground_truth": 0}, {"key": "35360689", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.37387583026278465, "ground_truth": 0}, {"key": "35360689", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397004731164, "ground_truth": 0}, {"key": "29202793", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.684264008790122, "ground_truth": 0}, {"key": "29202793", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6943026766498552, "ground_truth": 0}, {"key": "29202793", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.646013710157979, "ground_truth": 0}, {"key": "29202793", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094579565028, "ground_truth": 0}, {"key": "29202793", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512699069723, "ground_truth": 0}, {"key": "35999008", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7057850173469645, "ground_truth": 0}, {"key": "35999008", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6150878552698803, "ground_truth": 0}, {"key": "35999008", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7122321949643327, "ground_truth": 0}, {"key": "35999008", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279511964514288, "ground_truth": 0}, {"key": "35999008", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159658637547, "ground_truth": 0}, {"key": "31797119", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8925625184487551, "ground_truth": 0}, {"key": "31797119", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9059898185411563, "ground_truth": 0}, {"key": "31797119", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.847967761056692, "ground_truth": 0}, {"key": "31797119", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9136765244132302, "ground_truth": 0}, {"key": "31797119", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274174638987, "ground_truth": 0}, {"key": "26711893", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7025300279399604, "ground_truth": 0}, {"key": "26711893", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.793105945292321, "ground_truth": 0}, {"key": "26711893", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8749346326722853, "ground_truth": 0}, {"key": "26711893", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423201185017, "ground_truth": 0}, {"key": "26711893", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324934443372, "ground_truth": 0}, {"key": "35348288", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5544704562078614, "ground_truth": 0}, {"key": "35348288", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.42250459861075035, "ground_truth": 0}, {"key": "35348288", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6442251071795765, "ground_truth": 0}, {"key": "35348288", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074046981045808, "ground_truth": 0}, {"key": "35348288", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089408154554, "ground_truth": 0}, {"key": "38124131", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4436004089719362, "ground_truth": 0}, {"key": "38124131", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.4455295591737689, "ground_truth": 0}, {"key": "38124131", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6388352661658355, "ground_truth": 0}, {"key": "38124131", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352551016825, "ground_truth": 0}, {"key": "38124131", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216117725435, "ground_truth": 0}, {"key": "20285901", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8255897192814995, "ground_truth": 0}, {"key": "20285901", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6943026753484919, "ground_truth": 0}, {"key": "20285901", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.740174349393089, "ground_truth": 0}, {"key": "20285901", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154240191045507, "ground_truth": 0}, {"key": "20285901", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.863391613136181, "ground_truth": 0}, {"key": "35633632", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7732163677559818, "ground_truth": 0}, {"key": "35633632", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8019358223262278, "ground_truth": 0}, {"key": "35633632", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7341195280530872, "ground_truth": 0}, {"key": "35633632", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336840309718, "ground_truth": 0}, {"key": "35633632", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789026543522, "ground_truth": 0}, {"key": "10741274", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6893055993673776, "ground_truth": 0}, {"key": "10741274", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7310586012512869, "ground_truth": 0}, {"key": "10741274", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6495786231572723, "ground_truth": 0}, {"key": "10741274", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477981946087398, "ground_truth": 0}, {"key": "10741274", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833944097702, "ground_truth": 0}, {"key": "30605795", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7325918517521234, "ground_truth": 0}, {"key": "30605795", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7325918460784074, "ground_truth": 0}, {"key": "30605795", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8509647121377438, "ground_truth": 0}, {"key": "30605795", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872186698045, "ground_truth": 0}, {"key": "30605795", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118930307575, "ground_truth": 0}, {"key": "30539722", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7826624792897765, "ground_truth": 0}, {"key": "30539722", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.799442301815117, "ground_truth": 0}, {"key": "30539722", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7233094760675377, "ground_truth": 0}, {"key": "30539722", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867566071716, "ground_truth": 0}, {"key": "30539722", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762779892888, "ground_truth": 0}, {"key": "18639299", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7839884530157403, "ground_truth": 0}, {"key": "18639299", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6740504881443106, "ground_truth": 0}, {"key": "18639299", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6992544305068964, "ground_truth": 0}, {"key": "18639299", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666549175908, "ground_truth": 0}, {"key": "18639299", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737453349372, "ground_truth": 0}, {"key": "39773552", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9425067261210487, "ground_truth": 0}, {"key": "39773552", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9582261211665639, "ground_truth": 0}, {"key": "39773552", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9196425325524882, "ground_truth": 0}, {"key": "39773552", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9553191292013239, "ground_truth": 0}, {"key": "39773552", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.937210792900612, "ground_truth": 0}, {"key": "34086410", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5253688304710961, "ground_truth": 0}, {"key": "34086410", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5544704832120092, "ground_truth": 0}, {"key": "34086410", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5774953736167681, "ground_truth": 0}, {"key": "34086410", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026834035435, "ground_truth": 0}, {"key": "34086410", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774739921561713, "ground_truth": 0}, {"key": "35454652", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7431679826072671, "ground_truth": 0}, {"key": "35454652", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.861538201294835, "ground_truth": 0}, {"key": "35454652", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7520125786163522, "ground_truth": 0}, {"key": "35454652", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185944026038611, "ground_truth": 0}, {"key": "35454652", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575629756886, "ground_truth": 0}, {"key": "36158310", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.804405924640486, "ground_truth": 0}, {"key": "36158310", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5907791787959484, "ground_truth": 0}, {"key": "36158310", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8289388076299025, "ground_truth": 0}, {"key": "36158310", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891268329586, "ground_truth": 0}, {"key": "36158310", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300567863755, "ground_truth": 0}, {"key": "35688387", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6113819731453431, "ground_truth": 0}, {"key": "35688387", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8322366547622521, "ground_truth": 0}, {"key": "35688387", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5794004224349849, "ground_truth": 0}, {"key": "35688387", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358609648204, "ground_truth": 0}, {"key": "35688387", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292634021280633, "ground_truth": 0}, {"key": "34209292", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8386797620854607, "ground_truth": 0}, {"key": "34209292", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6688802366220751, "ground_truth": 0}, {"key": "34209292", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7826624648601841, "ground_truth": 0}, {"key": "34209292", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.834406878344832, "ground_truth": 0}, {"key": "34209292", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802440050927, "ground_truth": 0}, {"key": "25037859", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6740504986343745, "ground_truth": 0}, {"key": "25037859", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6150878817371012, "ground_truth": 0}, {"key": "25037859", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.611381967914242, "ground_truth": 0}, {"key": "25037859", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163752096475, "ground_truth": 0}, {"key": "25037859", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105502386315, "ground_truth": 0}, {"key": "36412121", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9184802365472866, "ground_truth": 0}, {"key": "36412121", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9178933700373535, "ground_truth": 0}, {"key": "36412121", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9343951695831235, "ground_truth": 0}, {"key": "36412121", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9469902282993792, "ground_truth": 0}, {"key": "36412121", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070140509204, "ground_truth": 0}, {"key": "34909172", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.744656342276725, "ground_truth": 0}, {"key": "34909172", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5621765064537081, "ground_truth": 0}, {"key": "34909172", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6859494541629929, "ground_truth": 0}, {"key": "34909172", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026855276097, "ground_truth": 0}, {"key": "34909172", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646088129121, "ground_truth": 0}, {"key": "39011806", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9059898119515418, "ground_truth": 0}, {"key": "39011806", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9489172628548976, "ground_truth": 0}, {"key": "39011806", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.960062680651383, "ground_truth": 0}, {"key": "39011806", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9372107913036547, "ground_truth": 0}, {"key": "39011806", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037327615917, "ground_truth": 0}, {"key": "33096163", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8289388235185422, "ground_truth": 0}, {"key": "33096163", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8697145889566591, "ground_truth": 0}, {"key": "33096163", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8322366518983103, "ground_truth": 0}, {"key": "33096163", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163765963505, "ground_truth": 0}, {"key": "33096163", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624796081652, "ground_truth": 0}, {"key": "38762205", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9190632914696509, "ground_truth": 0}, {"key": "38762205", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.945801272747846, "ground_truth": 0}, {"key": "38762205", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9241418210385369, "ground_truth": 0}, {"key": "38762205", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9635062278680939, "ground_truth": 0}, {"key": "38762205", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9196425285291087, "ground_truth": 0}, {"key": "35519177", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9066531222212076, "ground_truth": 0}, {"key": "35519177", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526329659156, "ground_truth": 0}, {"key": "35519177", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9329437092870653, "ground_truth": 0}, {"key": "35519177", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377780428945, "ground_truth": 0}, {"key": "35519177", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204076999809, "ground_truth": 0}, {"key": "36192531", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7090191072494227, "ground_truth": 0}, {"key": "36192531", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.859663751843042, "ground_truth": 0}, {"key": "36192531", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7461389971702714, "ground_truth": 0}, {"key": "36192531", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324946210773, "ground_truth": 0}, {"key": "36192531", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324899656773, "ground_truth": 0}, {"key": "33160852", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9553191284321705, "ground_truth": 0}, {"key": "33160852", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9738443819632134, "ground_truth": 0}, {"key": "33160852", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9775429439670149, "ground_truth": 0}, {"key": "33160852", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9755769094368326, "ground_truth": 0}, {"key": "33160852", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9606574962346018, "ground_truth": 0}, {"key": "36312304", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5640985032617875, "ground_truth": 0}, {"key": "36312304", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6150878351851863, "ground_truth": 0}, {"key": "36312304", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7041601209655112, "ground_truth": 0}, {"key": "36312304", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011380335073, "ground_truth": 0}, {"key": "36312304", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601724297710831, "ground_truth": 0}, {"key": "33773343", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6424324885877674, "ground_truth": 0}, {"key": "33773343", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7185943977004627, "ground_truth": 0}, {"key": "33773343", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7839884641001643, "ground_truth": 0}, {"key": "33773343", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898355865946, "ground_truth": 0}, {"key": "33773343", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884585522799, "ground_truth": 0}, {"key": "34913320", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5640984901976361, "ground_truth": 0}, {"key": "34913320", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.712232206251087, "ground_truth": 0}, {"key": "34913320", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6808786121167085, "ground_truth": 0}, {"key": "34913320", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366091398058, "ground_truth": 0}, {"key": "34913320", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.720171500023257, "ground_truth": 0}, {"key": "33784155", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8019358302033331, "ground_truth": 0}, {"key": "33784155", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8499711748329776, "ground_truth": 0}, {"key": "33784155", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9130583483358375, "ground_truth": 0}, {"key": "33784155", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118808485471, "ground_truth": 0}, {"key": "33784155", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762712762649, "ground_truth": 0}, {"key": "24085062", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9868787290209495, "ground_truth": 0}, {"key": "24085062", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9974688887968426, "ground_truth": 0}, {"key": "24085062", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9832145096311501, "ground_truth": 0}, {"key": "24085062", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9890976263964966, "ground_truth": 0}, {"key": "24085062", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9924227590581619, "ground_truth": 0}, {"key": "33893487", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5214711789936186, "ground_truth": 0}, {"key": "33893487", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.3960681508485857, "ground_truth": 0}, {"key": "33893487", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.40922079534315325, "ground_truth": 0}, {"key": "33893487", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199023763405, "ground_truth": 0}, {"key": "33893487", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378235104221625, "ground_truth": 0}, {"key": "40913011", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9339146213642365, "ground_truth": 0}, {"key": "40913011", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9130583457574708, "ground_truth": 0}, {"key": "40913011", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9485372354087107, "ground_truth": 0}, {"key": "40913011", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583492354495, "ground_truth": 0}, {"key": "40913011", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.919642533064863, "ground_truth": 0}, {"key": "29642545", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5698526538963723, "ground_truth": 0}, {"key": "29642545", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6601723861414525, "ground_truth": 0}, {"key": "29642545", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7634837677519399, "ground_truth": 0}, {"key": "29642545", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300756613585, "ground_truth": 0}, {"key": "29642545", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872069859256, "ground_truth": 0}, {"key": "35969159", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7918210708854195, "ground_truth": 0}, {"key": "35969159", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7981867812582863, "ground_truth": 0}, {"key": "35969159", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.741674020765085, "ground_truth": 0}, {"key": "35969159", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637512495924, "ground_truth": 0}, {"key": "35969159", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431679935930455, "ground_truth": 0}, {"key": "37081669", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.46101680338234713, "ground_truth": 0}, {"key": "37081669", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6876299902446271, "ground_truth": 0}, {"key": "37081669", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5736784108612323, "ground_truth": 0}, {"key": "37081669", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102555320269, "ground_truth": 0}, {"key": "37081669", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640441699303, "ground_truth": 0}, {"key": "40048022", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7918210832833777, "ground_truth": 0}, {"key": "40048022", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8940517144931206, "ground_truth": 0}, {"key": "40048022", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7620701157789582, "ground_truth": 0}, {"key": "40048022", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307722211196, "ground_truth": 0}, {"key": "40048022", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.65665827266538, "ground_truth": 0}, {"key": "32884004", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9429286054410163, "ground_truth": 0}, {"key": "32884004", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9299510386729417, "ground_truth": 0}, {"key": "32884004", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.897695294698398, "ground_truth": 0}, {"key": "32884004", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213760557636, "ground_truth": 0}, {"key": "32884004", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297837354646, "ground_truth": 0}, {"key": "39022490", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7905303142640522, "ground_truth": 0}, {"key": "39022490", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8469578444401177, "ground_truth": 0}, {"key": "39022490", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8376199639417258, "ground_truth": 0}, {"key": "39022490", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637438032224, "ground_truth": 0}, {"key": "39022490", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528132885645, "ground_truth": 0}, {"key": "35159385", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7931059478945297, "ground_truth": 0}, {"key": "35159385", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7799928888029308, "ground_truth": 0}, {"key": "35159385", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7620701073472436, "ground_truth": 0}, {"key": "35159385", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.77458337588035, "ground_truth": 0}, {"key": "35159385", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388103567082, "ground_truth": 0}, {"key": "34363669", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5679366010615381, "ground_truth": 0}, {"key": "34363669", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5195213265280234, "ground_truth": 0}, {"key": "34363669", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6842640118279122, "ground_truth": 0}, {"key": "34363669", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117166155041085, "ground_truth": 0}, {"key": "34363669", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583270069573986, "ground_truth": 0}, {"key": "36119687", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9681411454975716, "ground_truth": 0}, {"key": "36119687", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.926835284508609, "ground_truth": 0}, {"key": "36119687", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9353465077619021, "ground_truth": 0}, {"key": "36119687", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9566341979843701, "ground_truth": 0}, {"key": "36119687", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9632305356027663, "ground_truth": 0}, {"key": "35217446", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.757794360169852, "ground_truth": 0}, {"key": "35217446", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7826624805242596, "ground_truth": 0}, {"key": "35217446", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8955226906077294, "ground_truth": 0}, {"key": "35217446", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509647069635862, "ground_truth": 0}, {"key": "35217446", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127601219779, "ground_truth": 0}, {"key": "39049331", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7025300760382229, "ground_truth": 0}, {"key": "39049331", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431680173026014, "ground_truth": 0}, {"key": "39049331", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7057850421491779, "ground_truth": 0}, {"key": "39049331", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438951024881592, "ground_truth": 0}, {"key": "39049331", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545687302846, "ground_truth": 0}, {"key": "36472242", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8068526035742928, "ground_truth": 0}, {"key": "36472242", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8175744712983699, "ground_truth": 0}, {"key": "36472242", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.87059727146801, "ground_truth": 0}, {"key": "36472242", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916005390689, "ground_truth": 0}, {"key": "36472242", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519527996900906, "ground_truth": 0}, {"key": "31854721", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8278281745606336, "ground_truth": 0}, {"key": "31854721", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8469578471575867, "ground_truth": 0}, {"key": "31854721", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8824278599775509, "ground_truth": 0}, {"key": "31854721", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916106268638, "ground_truth": 0}, {"key": "31854721", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789065398775, "ground_truth": 0}, {"key": "18725849", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7090191431824742, "ground_truth": 0}, {"key": "18725849", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6601723776090226, "ground_truth": 0}, {"key": "18725849", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6513548573606845, "ground_truth": 0}, {"key": "18725849", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321801610226, "ground_truth": 0}, {"key": "18725849", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118721921025, "ground_truth": 0}, {"key": "36883179", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5389832302436572, "ground_truth": 0}, {"key": "36883179", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5350984127208379, "ground_truth": 0}, {"key": "36883179", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5253687986545096, "ground_truth": 0}, {"key": "36883179", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203151792938, "ground_truth": 0}, {"key": "36883179", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.41869690734310244, "ground_truth": 0}, {"key": "34266359", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.762070126683538, "ground_truth": 0}, {"key": "34266359", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.825589732366675, "ground_truth": 0}, {"key": "34266359", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7879312013698653, "ground_truth": 0}, {"key": "34266359", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898322322218, "ground_truth": 0}, {"key": "34266359", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826625060669281, "ground_truth": 0}, {"key": "31920289", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6842640313262603, "ground_truth": 0}, {"key": "31920289", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6943026930298508, "ground_truth": 0}, {"key": "31920289", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6169358043688953, "ground_truth": 0}, {"key": "31920289", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688298139911, "ground_truth": 0}, {"key": "31920289", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.47268346691718727, "ground_truth": 0}, {"key": "36292997", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437654752076, "ground_truth": 0}, {"key": "36292997", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.806852629343157, "ground_truth": 0}, {"key": "36292997", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8255897378443907, "ground_truth": 0}, {"key": "36292997", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.867035760721511, "ground_truth": 0}, {"key": "36292997", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789184589282, "ground_truth": 0}, {"key": "30412533", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8164063703571389, "ground_truth": 0}, {"key": "30412533", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619280060489, "ground_truth": 0}, {"key": "30412533", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7505527613469072, "ground_truth": 0}, {"key": "30412533", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031738128667483, "ground_truth": 0}, {"key": "30412533", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445477583324, "ground_truth": 0}, {"key": "40433191", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9246876888184927, "ground_truth": 0}, {"key": "40433191", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.917302658264475, "ground_truth": 0}, {"key": "40433191", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9319595779258121, "ground_truth": 0}, {"key": "40433191", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9437636541869632, "ground_truth": 0}, {"key": "40433191", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105559088931, "ground_truth": 0}, {"key": "34565591", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5698526537740055, "ground_truth": 0}, {"key": "34565591", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6315942872865172, "ground_truth": 0}, {"key": "34565591", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7356416481329319, "ground_truth": 0}, {"key": "34565591", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.616935828149704, "ground_truth": 0}, {"key": "34565591", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.41489883067430616, "ground_truth": 0}, {"key": "36062480", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8984105574647143, "ground_truth": 0}, {"key": "36062480", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267118139592553, "ground_truth": 0}, {"key": "36062480", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9429285988515961, "ground_truth": 0}, {"key": "36062480", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9309620717455621, "ground_truth": 0}, {"key": "36062480", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149036697641, "ground_truth": 0}, {"key": "37276883", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8705972578236382, "ground_truth": 0}, {"key": "37276883", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8233284059207467, "ground_truth": 0}, {"key": "37276883", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9026096045305986, "ground_truth": 0}, {"key": "37276883", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681109914161, "ground_truth": 0}, {"key": "37276883", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127553702476, "ground_truth": 0}, {"key": "38509260", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8661325052526465, "ground_truth": 0}, {"key": "38509260", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8933094104093007, "ground_truth": 0}, {"key": "38509260", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8872045887587353, "ground_truth": 0}, {"key": "38509260", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185908179774, "ground_truth": 0}, {"key": "38509260", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388118472437, "ground_truth": 0}, {"key": "37139607", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9637799417388528, "ground_truth": 0}, {"key": "37139607", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9724147167768409, "ground_truth": 0}, {"key": "37139607", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9525741292789148, "ground_truth": 0}, {"key": "37139607", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9761291652558064, "ground_truth": 0}, {"key": "37139607", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9543079672996465, "ground_truth": 0}, {"key": "37092824", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9837225395642033, "ground_truth": 0}, {"key": "37092824", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9811668696496151, "ground_truth": 0}, {"key": "37092824", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9717790129836658, "ground_truth": 0}, {"key": "37092824", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9591542817901999, "ground_truth": 0}, {"key": "37092824", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9753900683683446, "ground_truth": 0}, {"key": "32191802", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.894051699079009, "ground_truth": 0}, {"key": "32191802", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8489722057407009, "ground_truth": 0}, {"key": "32191802", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9079671393152425, "ground_truth": 0}, {"key": "32191802", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9314625025335854, "ground_truth": 0}, {"key": "32191802", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9149009554505538, "ground_truth": 0}, {"key": "39396038", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9556514184404498, "ground_truth": 0}, {"key": "39396038", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9273632892074822, "ground_truth": 0}, {"key": "39396038", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.933914624253465, "ground_truth": 0}, {"key": "39396038", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9381240094118032, "ground_truth": 0}, {"key": "39396038", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9299510441665619, "ground_truth": 0}, {"key": "39076884", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8354835401593327, "ground_truth": 0}, {"key": "39076884", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545744589243, "ground_truth": 0}, {"key": "39076884", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8428631606123483, "ground_truth": 0}, {"key": "39076884", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127672641733, "ground_truth": 0}, {"key": "39076884", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239713996321, "ground_truth": 0}, {"key": "27763432", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6297746075474265, "ground_truth": 0}, {"key": "27763432", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.43014735174729574, "ground_truth": 0}, {"key": "27763432", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6001883934737855, "ground_truth": 0}, {"key": "27763432", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228908236783, "ground_truth": 0}, {"key": "27763432", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206215997866966, "ground_truth": 0}, {"key": "37806929", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.939024814214408, "ground_truth": 0}, {"key": "37806929", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9433475778269818, "ground_truth": 0}, {"key": "37806929", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9515039952671872, "ground_truth": 0}, {"key": "37806929", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9588471124064507, "ground_truth": 0}, {"key": "37806929", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9643214440407003, "ground_truth": 0}, {"key": "32334186", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7090191320335565, "ground_truth": 0}, {"key": "32334186", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6909762956117019, "ground_truth": 0}, {"key": "32334186", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6791786990394635, "ground_truth": 0}, {"key": "32334186", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437639208711, "ground_truth": 0}, {"key": "32334186", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933308326294, "ground_truth": 0}, {"key": "36187324", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9543079683512637, "ground_truth": 0}, {"key": "36187324", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.930458250639785, "ground_truth": 0}, {"key": "36187324", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9469902305861054, "ground_truth": 0}, {"key": "36187324", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767911057909, "ground_truth": 0}, {"key": "36187324", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9556514220367323, "ground_truth": 0}, {"key": "35306009", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9686195737501957, "ground_truth": 0}, {"key": "35306009", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9766692299991224, "ground_truth": 0}, {"key": "35306009", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.968619566661086, "ground_truth": 0}, {"key": "35306009", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9791955094383424, "ground_truth": 0}, {"key": "35306009", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9768465865918528, "ground_truth": 0}, {"key": "39490050", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6388353042947279, "ground_truth": 0}, {"key": "39490050", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7170118856021479, "ground_truth": 0}, {"key": "39490050", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6601723757510568, "ground_truth": 0}, {"key": "39490050", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878602386382, "ground_truth": 0}, {"key": "39490050", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643738960144, "ground_truth": 0}, {"key": "38072149", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6774740151517593, "ground_truth": 0}, {"key": "38072149", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7090191398361069, "ground_truth": 0}, {"key": "38072149", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7732163734582878, "ground_truth": 0}, {"key": "38072149", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339614982148, "ground_truth": 0}, {"key": "38072149", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672194372901, "ground_truth": 0}, {"key": "35899689", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867908036057, "ground_truth": 0}, {"key": "35899689", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7090191320624621, "ground_truth": 0}, {"key": "35899689", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7732163412611402, "ground_truth": 0}, {"key": "35899689", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760334216403, "ground_truth": 0}, {"key": "35899689", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.881614912637238, "ground_truth": 0}, {"key": "27994518", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7826624792373806, "ground_truth": 0}, {"key": "27994518", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.818736776891657, "ground_truth": 0}, {"key": "27994518", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8984105557203181, "ground_truth": 0}, {"key": "27994518", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956581145070283, "ground_truth": 0}, {"key": "27994518", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063751073839, "ground_truth": 0}, {"key": "10615479", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5234203631842496, "ground_truth": 0}, {"key": "10615479", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6057990550769626, "ground_truth": 0}, {"key": "10615479", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.726425615430753, "ground_truth": 0}, {"key": "10615479", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.4649015716385133, "ground_truth": 0}, {"key": "10615479", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370308069735637, "ground_truth": 0}, {"key": "40186667", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8864204127846074, "ground_truth": 0}, {"key": "40186667", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7138307575575026, "ground_truth": 0}, {"key": "40186667", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8652240955008182, "ground_truth": 0}, {"key": "40186667", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366601418388, "ground_truth": 0}, {"key": "40186667", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872087742354, "ground_truth": 0}, {"key": "38622886", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7931059594815723, "ground_truth": 0}, {"key": "38622886", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619212977172, "ground_truth": 0}, {"key": "38622886", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8418256542823009, "ground_truth": 0}, {"key": "38622886", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325161490688, "ground_truth": 0}, {"key": "38622886", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358275630407, "ground_truth": 0}, {"key": "40686943", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228217843283, "ground_truth": 0}, {"key": "40686943", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7931059628880871, "ground_truth": 0}, {"key": "40686943", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7931059416557562, "ground_truth": 0}, {"key": "40686943", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324878566445, "ground_truth": 0}, {"key": "40686943", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972759800058, "ground_truth": 0}, {"key": "30604567", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9801292847908748, "ground_truth": 0}, {"key": "30604567", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9722043751234862, "ground_truth": 0}, {"key": "30604567", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9845754480798858, "ground_truth": 0}, {"key": "30604567", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9833429601724479, "ground_truth": 0}, {"key": "30604567", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9799765601122956, "ground_truth": 0}, {"key": "35440903", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7634837572988128, "ground_truth": 0}, {"key": "35440903", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7549149844573947, "ground_truth": 0}, {"key": "35440903", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8175744724712838, "ground_truth": 0}, {"key": "35440903", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583221033554, "ground_truth": 0}, {"key": "35440903", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199706924726, "ground_truth": 0}, {"key": "37219533", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5660185278284783, "ground_truth": 0}, {"key": "37219533", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6909762743936356, "ground_truth": 0}, {"key": "37219533", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6334102402735264, "ground_truth": 0}, {"key": "37219533", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983122113298095, "ground_truth": 0}, {"key": "37219533", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704648003200465, "ground_truth": 0}, {"key": "40178965", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8840392946975296, "ground_truth": 0}, {"key": "40178965", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8910549518208655, "ground_truth": 0}, {"key": "40178965", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8783142533169401, "ground_truth": 0}, {"key": "40178965", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204095367244, "ground_truth": 0}, {"key": "40178965", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8887587910123393, "ground_truth": 0}, {"key": "13750468", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8918110455696526, "ground_truth": 0}, {"key": "13750468", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7690802421041534, "ground_truth": 0}, {"key": "13750468", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7718434964750225, "ground_truth": 0}, {"key": "13750468", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970751892591, "ground_truth": 0}, {"key": "13750468", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085728516845, "ground_truth": 0}, {"key": "17754949", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6976089238937474, "ground_truth": 0}, {"key": "17754949", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5945512738919443, "ground_truth": 0}, {"key": "17754949", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7476159532803411, "ground_truth": 0}, {"key": "17754949", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085828505815, "ground_truth": 0}, {"key": "17754949", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936654559347, "ground_truth": 0}, {"key": "36675623", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9658995765481801, "ground_truth": 0}, {"key": "36675623", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9612438079918563, "ground_truth": 0}, {"key": "36675623", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9643214475112667, "ground_truth": 0}, {"key": "36675623", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9681411441550841, "ground_truth": 0}, {"key": "36675623", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9623913673042982, "ground_truth": 0}, {"key": "40035440", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9833429615330381, "ground_truth": 0}, {"key": "40035440", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9575961722153986, "ground_truth": 0}, {"key": "40035440", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9618217270490576, "ground_truth": 0}, {"key": "40035440", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9791955093633378, "ground_truth": 0}, {"key": "40035440", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.979822680732765, "ground_truth": 0}, {"key": "37685909", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.864310449111878, "ground_truth": 0}, {"key": "37685909", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7008947840656756, "ground_truth": 0}, {"key": "37685909", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8933094062140158, "ground_truth": 0}, {"key": "37685909", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.774583383139183, "ground_truth": 0}, {"key": "37685909", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264255909106686, "ground_truth": 0}, {"key": "36938787", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8418256519472417, "ground_truth": 0}, {"key": "36938787", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9005297862837317, "ground_truth": 0}, {"key": "36938787", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9372107932570809, "ground_truth": 0}, {"key": "36938787", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9066531276983564, "ground_truth": 0}, {"key": "36938787", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923189067978, "ground_truth": 0}, {"key": "39398068", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6242935366809813, "ground_truth": 0}, {"key": "39398068", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.749087208701596, "ground_truth": 0}, {"key": "39398068", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8459424528908792, "ground_truth": 0}, {"key": "39398068", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743718479868, "ground_truth": 0}, {"key": "39398068", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995869653642, "ground_truth": 0}, {"key": "39926408", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7505527687595404, "ground_truth": 0}, {"key": "39926408", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.81989334723903, "ground_truth": 0}, {"key": "39926408", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6959583218609424, "ground_truth": 0}, {"key": "39926408", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059209815768, "ground_truth": 0}, {"key": "39926408", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321844773192, "ground_truth": 0}, {"key": "40465336", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8354835403621312, "ground_truth": 0}, {"key": "40465336", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8864204168874852, "ground_truth": 0}, {"key": "40465336", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8998277787587193, "ground_truth": 0}, {"key": "40465336", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583463469922, "ground_truth": 0}, {"key": "40465336", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274155003706, "ground_truth": 0}, {"key": "34173549", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9637799437503127, "ground_truth": 0}, {"key": "34173549", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9700134968802279, "ground_truth": 0}, {"key": "34173549", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9791955107524941, "ground_truth": 0}, {"key": "34173549", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9656413113367944, "ground_truth": 0}, {"key": "34173549", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9761291652418694, "ground_truth": 0}, {"key": "33541535", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8068526220630361, "ground_truth": 0}, {"key": "33541535", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.855851157073473, "ground_truth": 0}, {"key": "33541535", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7892337076553576, "ground_truth": 0}, {"key": "33541535", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762963739672, "ground_truth": 0}, {"key": "33541535", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797717032275, "ground_truth": 0}, {"key": "35685195", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8705972794462302, "ground_truth": 0}, {"key": "35685195", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8479677554854529, "ground_truth": 0}, {"key": "35685195", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9105453978058292, "ground_truth": 0}, {"key": "35685195", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891234289905, "ground_truth": 0}, {"key": "35685195", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531181737149, "ground_truth": 0}, {"key": "28440730", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5660185406753373, "ground_truth": 0}, {"key": "28440730", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7122321889492754, "ground_truth": 0}, {"key": "28440730", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7106283146839886, "ground_truth": 0}, {"key": "28440730", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.596433137015434, "ground_truth": 0}, {"key": "28440730", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982110247441, "ground_truth": 0}, {"key": "38338714", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.969785411525892, "ground_truth": 0}, {"key": "38338714", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.958226120136187, "ground_truth": 0}, {"key": "38338714", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9518632277451606, "ground_truth": 0}, {"key": "38338714", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9525741291584385, "ground_truth": 0}, {"key": "38338714", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9815951095200087, "ground_truth": 0}, {"key": "32191881", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8152324985825611, "ground_truth": 0}, {"key": "32191881", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7704648054110207, "ground_truth": 0}, {"key": "32191881", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7981867708135073, "ground_truth": 0}, {"key": "32191881", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723317004476591, "ground_truth": 0}, {"key": "32191881", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575432082732, "ground_truth": 0}, {"key": "37707251", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8164063763595538, "ground_truth": 0}, {"key": "37707251", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8449215199813651, "ground_truth": 0}, {"key": "37707251", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8587185779393433, "ground_truth": 0}, {"key": "37707251", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149082696061, "ground_truth": 0}, {"key": "37707251", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357591835508, "ground_truth": 0}, {"key": "40172567", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5214711496727658, "ground_truth": 0}, {"key": "40172567", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6706082868236588, "ground_truth": 0}, {"key": "40172567", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6531268930540841, "ground_truth": 0}, {"key": "40172567", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.38861804578407705, "ground_truth": 0}, {"key": "40172567", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.777299857544744, "ground_truth": 0}, {"key": "33113255", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7905303065942126, "ground_truth": 0}, {"key": "33113255", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8766343831074177, "ground_truth": 0}, {"key": "33113255", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8459424255814543, "ground_truth": 0}, {"key": "33113255", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897165945051, "ground_truth": 0}, {"key": "33113255", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.798186777291753, "ground_truth": 0}, {"key": "33022143", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7476159705027632, "ground_truth": 0}, {"key": "33022143", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5794003748908607, "ground_truth": 0}, {"key": "33022143", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6477982267342424, "ground_truth": 0}, {"key": "33022143", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690619936159, "ground_truth": 0}, {"key": "33022143", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740179996348, "ground_truth": 0}, {"key": "32084473", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9268352817106463, "ground_truth": 0}, {"key": "32084473", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9416541551953445, "ground_truth": 0}, {"key": "32084473", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9284087989232948, "ground_truth": 0}, {"key": "32084473", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9507778908136358, "ground_truth": 0}, {"key": "32084473", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9304582624449371, "ground_truth": 0}, {"key": "40564245", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8210441145100276, "ground_truth": 0}, {"key": "40564245", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9603611613114523, "ground_truth": 0}, {"key": "40564245", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9367494774370189, "ground_truth": 0}, {"key": "40564245", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9012274065893372, "ground_truth": 0}, {"key": "40564245", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204081181886, "ground_truth": 0}, {"key": "31717213", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7248702758510777, "ground_truth": 0}, {"key": "31717213", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7592254035230863, "ground_truth": 0}, {"key": "31717213", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8278281700846739, "ground_truth": 0}, {"key": "31717213", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068778721796, "ground_truth": 0}, {"key": "31717213", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434844940515, "ground_truth": 0}, {"key": "34861894", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.769080235156027, "ground_truth": 0}, {"key": "34861894", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7505527417956824, "ground_truth": 0}, {"key": "34861894", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7279754508487899, "ground_truth": 0}, {"key": "34861894", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.77321637983669, "ground_truth": 0}, {"key": "34861894", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.626124185695824, "ground_truth": 0}, {"key": "40838760", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8791467591732639, "ground_truth": 0}, {"key": "40838760", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9086179004903988, "ground_truth": 0}, {"key": "40838760", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9019206732964175, "ground_truth": 0}, {"key": "40838760", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036249041914, "ground_truth": 0}, {"key": "40838760", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9441768595857954, "ground_truth": 0}, {"key": "40044849", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8749346196098042, "ground_truth": 0}, {"key": "40044849", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8840392914541358, "ground_truth": 0}, {"key": "40044849", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7356416385252338, "ground_truth": 0}, {"key": "40044849", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916002076933, "ground_truth": 0}, {"key": "40044849", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059142480313, "ground_truth": 0}, {"key": "30296116", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7918210695433713, "ground_truth": 0}, {"key": "30296116", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6943026758195573, "ground_truth": 0}, {"key": "30296116", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148333905365, "ground_truth": 0}, {"key": "30296116", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762864392804, "ground_truth": 0}, {"key": "30296116", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197453039955, "ground_truth": 0}, {"key": "34931360", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6370307916953518, "ground_truth": 0}, {"key": "34931360", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8705972605113463, "ground_truth": 0}, {"key": "34931360", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7563575688300757, "ground_truth": 0}, {"key": "34931360", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026444977578, "ground_truth": 0}, {"key": "34931360", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527965885443, "ground_truth": 0}, {"key": "18862422", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6688802834150035, "ground_truth": 0}, {"key": "18862422", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.778649293766154, "ground_truth": 0}, {"key": "18862422", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.640635836700629, "ground_truth": 0}, {"key": "18862422", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640206444561, "ground_truth": 0}, {"key": "18862422", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241977706694, "ground_truth": 0}, {"key": "36361140", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8233284096399011, "ground_truth": 0}, {"key": "36361140", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8832359865595915, "ground_truth": 0}, {"key": "36361140", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8910549574819704, "ground_truth": 0}, {"key": "36361140", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9155072425352784, "ground_truth": 0}, {"key": "36361140", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872045861196116, "ground_truth": 0}, {"key": "39703329", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5964331125936994, "ground_truth": 0}, {"key": "39703329", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7905303032642809, "ground_truth": 0}, {"key": "39703329", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.49414087094727804, "ground_truth": 0}, {"key": "39703329", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880025806872, "ground_truth": 0}, {"key": "39703329", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995851108622, "ground_truth": 0}, {"key": "34033324", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9178933752673714, "ground_truth": 0}, {"key": "34033324", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9445872045648294, "ground_truth": 0}, {"key": "34033324", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8509647012085146, "ground_truth": 0}, {"key": "34033324", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9385759637604826, "ground_truth": 0}, {"key": "34033324", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8925625182585708, "ground_truth": 0}, {"key": "35658862", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8714748595074832, "ground_truth": 0}, {"key": "35658862", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.834406870405657, "ground_truth": 0}, {"key": "35658862", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8624675366032474, "ground_truth": 0}, {"key": "35658862", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948155518383, "ground_truth": 0}, {"key": "35658862", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338452514296, "ground_truth": 0}, {"key": "36092657", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9190633019934812, "ground_truth": 0}, {"key": "36092657", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9257686333283471, "ground_truth": 0}, {"key": "36092657", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9289263309197583, "ground_truth": 0}, {"key": "36092657", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9289263252185896, "ground_truth": 0}, {"key": "36092657", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9224823473840493, "ground_truth": 0}, {"key": "26333438", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6095241556566148, "ground_truth": 0}, {"key": "26333438", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7341195343752265, "ground_truth": 0}, {"key": "26333438", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7431680081681069, "ground_truth": 0}, {"key": "26333438", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784353561049, "ground_truth": 0}, {"key": "26333438", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898557067494, "ground_truth": 0}, {"key": "34184963", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5832033613640832, "ground_truth": 0}, {"key": "34184963", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.804405935597591, "ground_truth": 0}, {"key": "34184963", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.48828339754890554, "ground_truth": 0}, {"key": "34184963", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684684124939, "ground_truth": 0}, {"key": "34184963", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197716955585, "ground_truth": 0}, {"key": "35069975", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7090191321749458, "ground_truth": 0}, {"key": "35069975", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619253197517, "ground_truth": 0}, {"key": "35069975", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.863391614758411, "ground_truth": 0}, {"key": "35069975", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.842863154444346, "ground_truth": 0}, {"key": "35069975", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585774857578, "ground_truth": 0}, {"key": "36443950", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7217432128214109, "ground_truth": 0}, {"key": "36443950", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7718435040009541, "ground_truth": 0}, {"key": "36443950", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7248702753998516, "ground_truth": 0}, {"key": "36443950", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723949927609, "ground_truth": 0}, {"key": "36443950", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918060945643, "ground_truth": 0}, {"key": "29460858", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7185943971804873, "ground_truth": 0}, {"key": "29460858", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5175708936863753, "ground_truth": 0}, {"key": "29460858", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.509764390802754, "ground_truth": 0}, {"key": "29460858", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026946439536, "ground_truth": 0}, {"key": "29460858", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.562176466667983, "ground_truth": 0}, {"key": "36155704", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6297746257753696, "ground_truth": 0}, {"key": "36155704", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5097643539227018, "ground_truth": 0}, {"key": "36155704", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6224593233747612, "ground_truth": 0}, {"key": "36155704", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984683402038, "ground_truth": 0}, {"key": "36155704", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526586097693, "ground_truth": 0}, {"key": "37185211", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8469578430740398, "ground_truth": 0}, {"key": "37185211", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8887587859260092, "ground_truth": 0}, {"key": "37185211", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9219218397991232, "ground_truth": 0}, {"key": "37185211", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942233827867, "ground_truth": 0}, {"key": "37185211", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037266357961, "ground_truth": 0}, {"key": "36454885", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7563575684276033, "ground_truth": 0}, {"key": "36454885", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7634837444719517, "ground_truth": 0}, {"key": "36454885", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.695958326289235, "ground_truth": 0}, {"key": "36454885", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.626124181653775, "ground_truth": 0}, {"key": "36454885", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300854736333, "ground_truth": 0}, {"key": "33148906", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6442251238252991, "ground_truth": 0}, {"key": "33148906", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.4205996052621525, "ground_truth": 0}, {"key": "33148906", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6095241591154722, "ground_truth": 0}, {"key": "33148906", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734886211537, "ground_truth": 0}, {"key": "33148906", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935081711978, "ground_truth": 0}, {"key": "18086604", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6842640284763942, "ground_truth": 0}, {"key": "18086604", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6992544134971027, "ground_truth": 0}, {"key": "18086604", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.569852664522854, "ground_truth": 0}, {"key": "18086604", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064367130012, "ground_truth": 0}, {"key": "18086604", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494619180947, "ground_truth": 0}, {"key": "33693397", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673300154234, "ground_truth": 0}, {"key": "33693397", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267117839753052, "ground_truth": 0}, {"key": "33693397", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7943849726738488, "ground_truth": 0}, {"key": "33693397", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059539053087, "ground_truth": 0}, {"key": "33693397", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837794435173, "ground_truth": 0}, {"key": "39501530", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6057990440787072, "ground_truth": 0}, {"key": "39501530", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.42059959776410005, "ground_truth": 0}, {"key": "39501530", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.32423540300304254, "ground_truth": 0}, {"key": "39501530", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552955549529916, "ground_truth": 0}, {"key": "39501530", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591365952061, "ground_truth": 0}, {"key": "30948874", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7839884647335174, "ground_truth": 0}, {"key": "30948874", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8116760083566393, "ground_truth": 0}, {"key": "30948874", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8255897327306421, "ground_truth": 0}, {"key": "30948874", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9202179852756989, "ground_truth": 0}, {"key": "30948874", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923185831234, "ground_truth": 0}, {"key": "39410675", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8766343838040541, "ground_truth": 0}, {"key": "39410675", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8354835439877438, "ground_truth": 0}, {"key": "39410675", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.867933839486686, "ground_truth": 0}, {"key": "39410675", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9086179043185109, "ground_truth": 0}, {"key": "39410675", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204005076102, "ground_truth": 0}, {"key": "32903337", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6477982154920554, "ground_truth": 0}, {"key": "32903337", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.521471160030189, "ground_truth": 0}, {"key": "32903337", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6992544126831799, "ground_truth": 0}, {"key": "32903337", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026645448376, "ground_truth": 0}, {"key": "32903337", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964205458235, "ground_truth": 0}, {"key": "27685132", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.798186763889315, "ground_truth": 0}, {"key": "27685132", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7931059536322572, "ground_truth": 0}, {"key": "27685132", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8354835256385414, "ground_truth": 0}, {"key": "27685132", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416401002586, "ground_truth": 0}, {"key": "27685132", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754553042174, "ground_truth": 0}, {"key": "22791471", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8006920012769694, "ground_truth": 0}, {"key": "22791471", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.806852634720389, "ground_truth": 0}, {"key": "22791471", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8832359810200364, "ground_truth": 0}, {"key": "22791471", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357514355423, "ground_truth": 0}, {"key": "22791471", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624671266608, "ground_truth": 0}, {"key": "32292348", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7634837410471056, "ground_truth": 0}, {"key": "32292348", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8233284016062786, "ground_truth": 0}, {"key": "32292348", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8428631549740164, "ground_truth": 0}, {"key": "32292348", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802584622036, "ground_truth": 0}, {"key": "32292348", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281486650367, "ground_truth": 0}, {"key": "20482930", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8344068966549432, "ground_truth": 0}, {"key": "20482930", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7341195211678705, "ground_truth": 0}, {"key": "20482930", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8479677494138962, "ground_truth": 0}, {"key": "20482930", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300812453797, "ground_truth": 0}, {"key": "20482930", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760287241417, "ground_truth": 0}, {"key": "11635754", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7310585712368697, "ground_truth": 0}, {"key": "11635754", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7476159585002793, "ground_truth": 0}, {"key": "11635754", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6992544098948346, "ground_truth": 0}, {"key": "11635754", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615381978140125, "ground_truth": 0}, {"key": "11635754", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575579189991, "ground_truth": 0}, {"key": "40029096", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8519528146432486, "ground_truth": 0}, {"key": "40029096", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526168161212, "ground_truth": 0}, {"key": "40029096", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7759445605410006, "ground_truth": 0}, {"key": "40029096", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891479479594, "ground_truth": 0}, {"key": "40029096", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711744951042, "ground_truth": 0}, {"key": "40414719", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9385759589934607, "ground_truth": 0}, {"key": "40414719", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8991213815086708, "ground_truth": 0}, {"key": "40414719", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8816149051025938, "ground_truth": 0}, {"key": "40414719", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.878314246730218, "ground_truth": 0}, {"key": "40414719", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675379911589, "ground_truth": 0}, {"key": "39537616", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437698145512, "ground_truth": 0}, {"key": "39537616", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8198933327243273, "ground_truth": 0}, {"key": "39537616", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8910549466233968, "ground_truth": 0}, {"key": "39537616", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.85681229160633, "ground_truth": 0}, {"key": "39537616", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631371975193, "ground_truth": 0}, {"key": "33245830", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8116760290532794, "ground_truth": 0}, {"key": "33245830", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8661325102943032, "ground_truth": 0}, {"key": "33245830", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8311430570264463, "ground_truth": 0}, {"key": "33245830", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506431215875, "ground_truth": 0}, {"key": "33245830", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245832517985, "ground_truth": 0}, {"key": "39243601", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8799743690512166, "ground_truth": 0}, {"key": "39243601", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8955226789621191, "ground_truth": 0}, {"key": "39243601", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8757869924355668, "ground_truth": 0}, {"key": "39243601", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9155072447637702, "ground_truth": 0}, {"key": "39243601", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531250175313, "ground_truth": 0}, {"key": "35815905", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.729519785763256, "ground_truth": 0}, {"key": "35815905", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9155072410011009, "ground_truth": 0}, {"key": "35815905", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.685949437956871, "ground_truth": 0}, {"key": "35815905", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825942634475, "ground_truth": 0}, {"key": "35815905", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575452738853, "ground_truth": 0}, {"key": "35260212", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9099070011259158, "ground_truth": 0}, {"key": "35260212", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8879840583396831, "ground_truth": 0}, {"key": "35260212", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9142907181571521, "ground_truth": 0}, {"key": "35260212", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206765550207, "ground_truth": 0}, {"key": "35260212", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343700263095, "ground_truth": 0}, {"key": "39193924", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.679178701008952, "ground_truth": 0}, {"key": "39193924", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7606506776255513, "ground_truth": 0}, {"key": "39193924", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6654105664294059, "ground_truth": 0}, {"key": "39193924", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.726425610506801, "ground_truth": 0}, {"key": "39193924", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358499831961, "ground_truth": 0}, {"key": "40658569", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5926665860110322, "ground_truth": 0}, {"key": "40658569", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5964331252669071, "ground_truth": 0}, {"key": "40658569", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.834406884435899, "ground_truth": 0}, {"key": "40658569", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918164739983, "ground_truth": 0}, {"key": "40658569", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506225298342, "ground_truth": 0}, {"key": "33497596", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8940517141380238, "ground_truth": 0}, {"key": "33497596", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8080672265197859, "ground_truth": 0}, {"key": "33497596", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8152324986750726, "ground_truth": 0}, {"key": "33497596", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.844921521699878, "ground_truth": 0}, {"key": "33497596", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867766408978, "ground_truth": 0}, {"key": "40339241", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7853085844375052, "ground_truth": 0}, {"key": "40339241", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8116760182327578, "ground_truth": 0}, {"key": "40339241", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7718434899189026, "ground_truth": 0}, {"key": "40339241", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.749087222454216, "ground_truth": 0}, {"key": "40339241", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998686283986, "ground_truth": 0}, {"key": "31792608", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8679338564068019, "ground_truth": 0}, {"key": "31792608", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7170118849450976, "ground_truth": 0}, {"key": "31792608", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.769080242047054, "ground_truth": 0}, {"key": "31792608", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506467397807, "ground_truth": 0}, {"key": "31792608", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089125334591, "ground_truth": 0}, {"key": "33132662", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8322366530328423, "ground_truth": 0}, {"key": "33132662", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8799743641060872, "ground_truth": 0}, {"key": "33132662", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8449215310495221, "ground_truth": 0}, {"key": "33132662", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581558759922, "ground_truth": 0}, {"key": "33132662", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.869714576533056, "ground_truth": 0}, {"key": "37577457", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7446563372909816, "ground_truth": 0}, {"key": "37577457", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6531269227172036, "ground_truth": 0}, {"key": "37577457", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5813030982239411, "ground_truth": 0}, {"key": "37577457", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056386191728, "ground_truth": 0}, {"key": "37577457", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074047086266421, "ground_truth": 0}, {"key": "38701278", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9566341993320691, "ground_truth": 0}, {"key": "38701278", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9462003558149018, "ground_truth": 0}, {"key": "38701278", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9539660983068144, "ground_truth": 0}, {"key": "38701278", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9597620546072188, "ground_truth": 0}, {"key": "38701278", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9594592622288535, "ground_truth": 0}, {"key": "34570783", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9529258235978673, "ground_truth": 0}, {"key": "34570783", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9485372313883249, "ground_truth": 0}, {"key": "34570783", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9299510381706536, "ground_truth": 0}, {"key": "34570783", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9012274085240431, "ground_truth": 0}, {"key": "34570783", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907245202196, "ground_truth": 0}, {"key": "39064526", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5525397004553347, "ground_truth": 0}, {"key": "39064526", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7057850145959141, "ground_truth": 0}, {"key": "39064526", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6909762915254416, "ground_truth": 0}, {"key": "39064526", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.847967740345046, "ground_truth": 0}, {"key": "39064526", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.690976282640859, "ground_truth": 0}, {"key": "40741545", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8606036147599498, "ground_truth": 0}, {"key": "40741545", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9149009597960148, "ground_truth": 0}, {"key": "40741545", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8210440945951623, "ground_truth": 0}, {"key": "40741545", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343849524213, "ground_truth": 0}, {"key": "40741545", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046904259936, "ground_truth": 0}, {"key": "36929751", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9744347888120024, "ground_truth": 0}, {"key": "36929751", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9811668692220279, "ground_truth": 0}, {"key": "36929751", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9889278390878109, "ground_truth": 0}, {"key": "36929751", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9795114466805279, "ground_truth": 0}, {"key": "36929751", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9865717452347884, "ground_truth": 0}, {"key": "23984730", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.3923368328803472, "ground_truth": 0}, {"key": "23984730", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.4668456060427142, "ground_truth": 0}, {"key": "23984730", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.509764384669085, "ground_truth": 0}, {"key": "23984730", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.464901555308335, "ground_truth": 0}, {"key": "23984730", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397007760023, "ground_truth": 0}, {"key": "36007415", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.935817347548569, "ground_truth": 0}, {"key": "36007415", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9241418268435505, "ground_truth": 0}, {"key": "36007415", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9167080849656567, "ground_truth": 0}, {"key": "36007415", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9257686278101535, "ground_truth": 0}, {"key": "36007415", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277922678847, "ground_truth": 0}, {"key": "38875041", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9412234442423781, "ground_truth": 0}, {"key": "38875041", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8816148975609681, "ground_truth": 0}, {"key": "38875041", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8661325229574979, "ground_truth": 0}, {"key": "38875041", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942158016002, "ground_truth": 0}, {"key": "38875041", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314825374277, "ground_truth": 0}]