[{"key": "35951548", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.061777287391911045, "res": {"No": 0.9382189866278711, "Yes": 0.061777287391911045}, "ground_truth": 0}, {"key": "35951548", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9938423537903023, "res": {"Yes": 0.9938423537903023, "No": 0.006156535983193701}, "ground_truth": 0}, {"key": "35951548", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9859265825896489, "res": {"Yes": 0.9859265825896489, "No": 0.014072822835663704}, "ground_truth": 1}, {"key": "35951548", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9812611440071959, "res": {"Yes": 0.9812611440071959, "No": 0.01873733540215518}, "ground_truth": 0}, {"key": "35951548", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.05116265538911946, "res": {"No": 0.9487392604691265, "Yes": 0.05116265538911946}, "ground_truth": 0}, {"key": "36266422", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.012170442655079551, "res": {"No": 0.9878293478510884, "Yes": 0.012170442655079551}, "ground_truth": 0}, {"key": "36266422", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989484495670493, "res": {"Yes": 0.9989484495670493, "No": 0.0010511694212826709}, "ground_truth": 0}, {"key": "36266422", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995108316118873, "res": {"Yes": 0.9995108316118873, "No": 0.0004882885675154745}, "ground_truth": 1}, {"key": "36266422", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9712531170378985, "res": {"Yes": 0.9712531170378985, "No": 0.028744802807299734}, "ground_truth": 0}, {"key": "36266422", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9713081060897075, "res": {"Yes": 0.9713081060897075, "No": 0.02869000714349139}, "ground_truth": 0}, {"key": "38826984", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.001401270435387548, "res": {"No": 0.9985985999793877, "Yes": 0.001401270435387548}, "ground_truth": 0}, {"key": "38826984", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995540566323144, "res": {"Yes": 0.9995540566323144, "No": 0.00044536806736375316}, "ground_truth": 0}, {"key": "38826984", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999306706693891, "res": {"Yes": 0.9999306706693891, "No": 6.88648961237666e-05}, "ground_truth": 1}, {"key": "38826984", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996020607688274, "res": {"Yes": 0.9996020607688274, "No": 0.0003973724721996881}, "ground_truth": 0}, {"key": "38826984", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997346464624792, "res": {"Yes": 0.9997346464624792, "No": 0.0002637373068550846}, "ground_truth": 0}, {"key": "34540833", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6268500447696932, "res": {"Yes": 0.6268500447696932, "No": 0.37314734892969637}, "ground_truth": 0}, {"key": "34540833", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9974238609560627, "res": {"Yes": 0.9974238609560627, "No": 0.002575801322688333}, "ground_truth": 0}, {"key": "34540833", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.981702338690656, "res": {"Yes": 0.981702338690656, "No": 0.018296783492874624}, "ground_truth": 1}, {"key": "34540833", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9947747235005384, "res": {"Yes": 0.9947747235005384, "No": 0.005224800310226829}, "ground_truth": 0}, {"key": "34540833", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9740760239975831, "res": {"Yes": 0.9740760239975831, "No": 0.02592321706597667}, "ground_truth": 0}, {"key": "20836172", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.004204205269378284, "res": {"No": 0.9957953626439416, "Yes": 0.004204205269378284}, "ground_truth": 0}, {"key": "20836172", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6485641237538996, "res": {"Yes": 0.6485641237538996, "No": 0.35143380744088626}, "ground_truth": 0}, {"key": "20836172", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7980118755511609, "res": {"Yes": 0.7980118755511609, "No": 0.20198615975350964}, "ground_truth": 1}, {"key": "20836172", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7157048125530201, "res": {"Yes": 0.7157048125530201, "No": 0.28429268230462745}, "ground_truth": 0}, {"key": "20836172", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8938060532656119, "res": {"Yes": 0.8938060532656119, "No": 0.10619225513492976}, "ground_truth": 0}, {"key": "35932467", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0007233473662069182, "res": {"No": 0.9992755600334334, "Yes": 0.0007233473662069182}, "ground_truth": 0}, {"key": "35932467", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9640468653933707, "res": {"Yes": 0.9640468653933707, "No": 0.03594800464397899}, "ground_truth": 0}, {"key": "35932467", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9113113753550711, "res": {"Yes": 0.9113113753550711, "No": 0.0886685782402835}, "ground_truth": 1}, {"key": "35932467", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9899109513800837, "res": {"Yes": 0.9899109513800837, "No": 0.010087220029217242}, "ground_truth": 0}, {"key": "35932467", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9891166587962512, "res": {"Yes": 0.9891166587962512, "No": 0.010881019912392523}, "ground_truth": 0}, {"key": "40758845", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6650023064409779, "res": {"Yes": 0.6650023064409779, "No": 0.3349970008110443}, "ground_truth": 0}, {"key": "40758845", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9386308247137887, "res": {"Yes": 0.9386308247137887, "No": 0.06136813822084496}, "ground_truth": 0}, {"key": "40758845", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.942754776778972, "res": {"Yes": 0.942754776778972, "No": 0.05724357900246822}, "ground_truth": 1}, {"key": "40758845", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9898310618607957, "res": {"Yes": 0.9898310618607957, "No": 0.010168307536776514}, "ground_truth": 0}, {"key": "40758845", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.14730783001524866, "res": {"No": 0.8526893440743277, "Yes": 0.14730783001524866}, "ground_truth": 0}, {"key": "30358490", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0036072718953052787, "res": {"No": 0.9963919618684756, "Yes": 0.0036072718953052787}, "ground_truth": 0}, {"key": "30358490", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.22172098763853748, "res": {"No": 0.7782519220155948, "Yes": 0.22172098763853748}, "ground_truth": 0}, {"key": "30358490", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9282726643590171, "res": {"Yes": 0.9282726643590171, "No": 0.07168673180750046}, "ground_truth": 1}, {"key": "30358490", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992675938404221, "res": {"Yes": 0.9992675938404221, "No": 0.0007313323137070693}, "ground_truth": 0}, {"key": "30358490", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985053033733617, "res": {"Yes": 0.9985053033733617, "No": 0.0014929966563183943}, "ground_truth": 0}, {"key": "34615665", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8525995520875833, "res": {"Yes": 0.8525995520875833, "No": 0.14739742040861767}, "ground_truth": 0}, {"key": "34615665", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9816407584344349, "res": {"Yes": 0.9816407584344349, "No": 0.018358132768936698}, "ground_truth": 0}, {"key": "34615665", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7764842965282623, "res": {"Yes": 0.7764842965282623, "No": 0.22351020634455698}, "ground_truth": 1}, {"key": "34615665", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.2999480158022292, "res": {"No": 0.7000494035003919, "Yes": 0.2999480158022292}, "ground_truth": 0}, {"key": "34615665", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.019231563835289452, "res": {"No": 0.9807667894975034, "Yes": 0.019231563835289452}, "ground_truth": 0}, {"key": "35890902", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9929609748112764, "res": {"Yes": 0.9929609748112764, "No": 0.007038670331623061}, "ground_truth": 0}, {"key": "35890902", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994005603857563, "res": {"Yes": 0.9994005603857563, "No": 0.0005991683185937222}, "ground_truth": 0}, {"key": "35890902", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998375943892193, "res": {"Yes": 0.9998375943892193, "No": 0.00016208219092535698}, "ground_truth": 1}, {"key": "35890902", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9966413871008986, "res": {"Yes": 0.9966413871008986, "No": 0.0033583426017332265}, "ground_truth": 0}, {"key": "35890902", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995002313659682, "res": {"Yes": 0.9995002313659682, "No": 0.0004993899522323099}, "ground_truth": 0}, {"key": "37922330", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9997563213444676, "res": {"Yes": 0.9997563213444676, "No": 0.00024346874036670676}, "ground_truth": 0}, {"key": "37922330", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999253068846696, "res": {"Yes": 0.9999253068846696, "No": 7.460798641375825e-05}, "ground_truth": 0}, {"key": "37922330", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994179465188867, "res": {"Yes": 0.9994179465188867, "No": 0.0005815640185359382}, "ground_truth": 1}, {"key": "37922330", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999243533313535, "res": {"Yes": 0.9999243533313535, "No": 7.551698198861929e-05}, "ground_truth": 0}, {"key": "37922330", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996411227918364, "res": {"Yes": 0.9996411227918364, "No": 0.0003586446831936899}, "ground_truth": 0}, {"key": "30844962", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999667875255465, "res": {"Yes": 0.9999667875255465, "No": 3.3161135009862736e-05}, "ground_truth": 0}, {"key": "30844962", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998350915388954, "res": {"Yes": 0.9998350915388954, "No": 0.00016461584675889614}, "ground_truth": 0}, {"key": "30844962", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999978707566687, "res": {"Yes": 0.999978707566687, "No": 2.1198513429392252e-05}, "ground_truth": 1}, {"key": "30844962", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999893165220688, "res": {"Yes": 0.9999893165220688, "No": 1.0494376664750945e-05}, "ground_truth": 0}, {"key": "30844962", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996506520362156, "res": {"Yes": 0.9996506520362156, "No": 0.000348363668298792}, "ground_truth": 0}, {"key": "36217333", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.009432382152267882, "res": {"No": 0.9905673283992097, "Yes": 0.009432382152267882}, "ground_truth": 0}, {"key": "36217333", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991300110899877, "res": {"Yes": 0.9991300110899877, "No": 0.0008698148370016229}, "ground_truth": 0}, {"key": "36217333", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9906258132207333, "res": {"Yes": 0.9906258132207333, "No": 0.009373750462582153}, "ground_truth": 1}, {"key": "36217333", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9987864537435287, "res": {"Yes": 0.9987864537435287, "No": 0.0012133708089273375}, "ground_truth": 0}, {"key": "36217333", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5036856075979427, "res": {"Yes": 0.5036856075979427, "No": 0.4963119591818186}, "ground_truth": 0}, {"key": "30816523", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0009715644020406508, "res": {"No": 0.9990281472251021, "Yes": 0.0009715644020406508}, "ground_truth": 0}, {"key": "30816523", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9939923883007536, "res": {"Yes": 0.9939923883007536, "No": 0.006006755658916024}, "ground_truth": 0}, {"key": "30816523", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9965102147047881, "res": {"Yes": 0.9965102147047881, "No": 0.0034885489599932786}, "ground_truth": 1}, {"key": "30816523", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.948881895163021, "res": {"Yes": 0.948881895163021, "No": 0.05111747825702595}, "ground_truth": 0}, {"key": "30816523", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9819863018119138, "res": {"Yes": 0.9819863018119138, "No": 0.0180115871074216}, "ground_truth": 0}, {"key": "38900884", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3180171076523826, "res": {"No": 0.6819815597458792, "Yes": 0.3180171076523826}, "ground_truth": 0}, {"key": "38900884", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.01633492214641744, "res": {"No": 0.9836540883135096, "Yes": 0.01633492214641744}, "ground_truth": 0}, {"key": "38900884", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00031961385306568266, "res": {"No": 0.9996797206603816, "Yes": 0.00031961385306568266}, "ground_truth": 1}, {"key": "38900884", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0008630787669125207, "res": {"No": 0.9991341721754097, "Yes": 0.0008630787669125207}, "ground_truth": 0}, {"key": "38900884", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.06782709721107232, "res": {"No": 0.9321686646642183, "Yes": 0.06782709721107232}, "ground_truth": 0}, {"key": "13890581", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9469529407581632, "res": {"Yes": 0.9469529407581632, "No": 0.05304571447167762}, "ground_truth": 0}, {"key": "13890581", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997811099699191, "res": {"Yes": 0.9997811099699191, "No": 0.00021880207585656597}, "ground_truth": 0}, {"key": "13890581", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9968543347052868, "res": {"Yes": 0.9968543347052868, "No": 0.0031441540736564305}, "ground_truth": 1}, {"key": "13890581", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9643867874971948, "res": {"Yes": 0.9643867874971948, "No": 0.035611893850426804}, "ground_truth": 0}, {"key": "13890581", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9968800404210174, "res": {"Yes": 0.9968800404210174, "No": 0.003118826405521894}, "ground_truth": 0}, {"key": "40194700", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.17071933273001066, "res": {"No": 0.8292790832652521, "Yes": 0.17071933273001066}, "ground_truth": 0}, {"key": "40194700", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9974935990811106, "res": {"Yes": 0.9974935990811106, "No": 0.0025058491997431375}, "ground_truth": 0}, {"key": "40194700", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9983150546170325, "res": {"Yes": 0.9983150546170325, "No": 0.0016842336933784528}, "ground_truth": 1}, {"key": "40194700", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996435060090888, "res": {"Yes": 0.9996435060090888, "No": 0.0003560255713703065}, "ground_truth": 0}, {"key": "40194700", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995876466410251, "res": {"Yes": 0.9995876466410251, "No": 0.0004118144805305976}, "ground_truth": 0}, {"key": "37903647", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.1806874384227173, "res": {"No": 0.8193116848042209, "Yes": 0.1806874384227173}, "ground_truth": 0}, {"key": "37903647", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9883572890628602, "res": {"Yes": 0.9883572890628602, "No": 0.011640929336038814}, "ground_truth": 0}, {"key": "37903647", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997136760385316, "res": {"Yes": 0.9997136760385316, "No": 0.0002861057672356664}, "ground_truth": 1}, {"key": "37903647", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992867497539711, "res": {"Yes": 0.9992867497539711, "No": 0.0007128940828409859}, "ground_truth": 0}, {"key": "37903647", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9938203347611888, "res": {"Yes": 0.9938203347611888, "No": 0.006179409266662768}, "ground_truth": 0}, {"key": "13291223", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996952086283304, "res": {"Yes": 0.9996952086283304, "No": 0.00030463354363831547}, "ground_truth": 0}, {"key": "13291223", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9986423550349128, "res": {"Yes": 0.9986423550349128, "No": 0.001357559739671466}, "ground_truth": 0}, {"key": "13291223", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999363920580709, "res": {"Yes": 0.9999363920580709, "No": 6.343955469321737e-05}, "ground_truth": 1}, {"key": "13291223", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999900317366834, "res": {"Yes": 0.9999900317366834, "No": 9.822449763087737e-06}, "ground_truth": 0}, {"key": "13291223", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999553444170902, "res": {"Yes": 0.9999553444170902, "No": 4.455327027033824e-05}, "ground_truth": 0}, {"key": "36052570", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9781799195960714, "res": {"Yes": 0.9781799195960714, "No": 0.02181789444055115}, "ground_truth": 0}, {"key": "36052570", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9808718352457579, "res": {"Yes": 0.9808718352457579, "No": 0.019127312338307098}, "ground_truth": 0}, {"key": "36052570", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.87787448600693, "res": {"Yes": 0.87787448600693, "No": 0.12211669195022587}, "ground_truth": 1}, {"key": "36052570", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.484033916164782, "res": {"No": 0.5159595025555684, "Yes": 0.484033916164782}, "ground_truth": 0}, {"key": "36052570", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9947164532934779, "res": {"Yes": 0.9947164532934779, "No": 0.005280111838258181}, "ground_truth": 0}, {"key": "34944735", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9626860372912791, "res": {"Yes": 0.9626860372912791, "No": 0.0373110145379513}, "ground_truth": 0}, {"key": "34944735", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9684513477868845, "res": {"Yes": 0.9684513477868845, "No": 0.03154419186402394}, "ground_truth": 0}, {"key": "34944735", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9673175255005451, "res": {"Yes": 0.9673175255005451, "No": 0.03267973885484756}, "ground_truth": 1}, {"key": "34944735", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9804201506900284, "res": {"Yes": 0.9804201506900284, "No": 0.01957741447272964}, "ground_truth": 0}, {"key": "34944735", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9524010708500465, "res": {"Yes": 0.9524010708500465, "No": 0.047596673720876004}, "ground_truth": 0}, {"key": "32159602", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996688803322216, "res": {"Yes": 0.9996688803322216, "No": 0.00033069964878902386}, "ground_truth": 0}, {"key": "32159602", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992300949291184, "res": {"Yes": 0.9992300949291184, "No": 0.0007693742775768762}, "ground_truth": 0}, {"key": "32159602", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998983692347562, "res": {"Yes": 0.9998983692347562, "No": 0.00010102010515423432}, "ground_truth": 1}, {"key": "32159602", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996647095724029, "res": {"Yes": 0.9996647095724029, "No": 0.00033471236730880184}, "ground_truth": 0}, {"key": "32159602", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994736772164553, "res": {"Yes": 0.9994736772164553, "No": 0.0005254205859498069}, "ground_truth": 0}, {"key": "34988915", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.02975454457004318, "res": {"No": 0.9702403128134208, "Yes": 0.02975454457004318}, "ground_truth": 0}, {"key": "34988915", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.4927029115858575, "res": {"No": 0.507283352924079, "Yes": 0.4927029115858575}, "ground_truth": 0}, {"key": "34988915", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9478987653829896, "res": {"Yes": 0.9478987653829896, "No": 0.05208975451213063}, "ground_truth": 1}, {"key": "34988915", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8673580687991836, "res": {"Yes": 0.8673580687991836, "No": 0.1326215096275446}, "ground_truth": 0}, {"key": "34988915", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8339313784871512, "res": {"Yes": 0.8339313784871512, "No": 0.16606157926272833}, "ground_truth": 0}, {"key": "37889203", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.40322232266702174, "res": {"No": 0.5967770416008619, "Yes": 0.40322232266702174}, "ground_truth": 0}, {"key": "37889203", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.016446411030696547, "res": {"No": 0.9835532817227315, "Yes": 0.016446411030696547}, "ground_truth": 0}, {"key": "37889203", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994496220635322, "res": {"Yes": 0.9994496220635322, "No": 0.0005499739744715388}, "ground_truth": 1}, {"key": "37889203", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9908111469262602, "res": {"Yes": 0.9908111469262602, "No": 0.009188312343607662}, "ground_truth": 0}, {"key": "37889203", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9579204711100526, "res": {"Yes": 0.9579204711100526, "No": 0.042078935833513034}, "ground_truth": 0}, {"key": "33609927", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5062628136338622, "res": {"Yes": 0.5062628136338622, "No": 0.4937303801309324}, "ground_truth": 0}, {"key": "33609927", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9956535323508869, "res": {"Yes": 0.9956535323508869, "No": 0.004333982559446872}, "ground_truth": 0}, {"key": "33609927", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9907158978935796, "res": {"Yes": 0.9907158978935796, "No": 0.009277414322956997}, "ground_truth": 1}, {"key": "33609927", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994653410810461, "res": {"Yes": 0.9994653410810461, "No": 0.0005323746963977489}, "ground_truth": 0}, {"key": "33609927", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9927073894743225, "res": {"Yes": 0.9927073894743225, "No": 0.007291273914584037}, "ground_truth": 0}, {"key": "33578778", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8357128548151617, "res": {"Yes": 0.8357128548151617, "No": 0.16428062260492984}, "ground_truth": 0}, {"key": "33578778", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5315581392874861, "res": {"Yes": 0.5315581392874861, "No": 0.4684385730440868}, "ground_truth": 0}, {"key": "33578778", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9109331548414261, "res": {"Yes": 0.9109331548414261, "No": 0.08906052359316811}, "ground_truth": 1}, {"key": "33578778", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8935842917466441, "res": {"Yes": 0.8935842917466441, "No": 0.10641406723057475}, "ground_truth": 0}, {"key": "33578778", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8003246028879563, "res": {"Yes": 0.8003246028879563, "No": 0.19967303005184642}, "ground_truth": 0}, {"key": "36888270", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9723955255507546, "res": {"Yes": 0.9723955255507546, "No": 0.027604104597931445}, "ground_truth": 0}, {"key": "36888270", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9988996835925147, "res": {"Yes": 0.9988996835925147, "No": 0.0011000754616838685}, "ground_truth": 0}, {"key": "36888270", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9857214188143073, "res": {"Yes": 0.9857214188143073, "No": 0.014276754839960177}, "ground_truth": 1}, {"key": "36888270", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978425509459804, "res": {"Yes": 0.9978425509459804, "No": 0.002157358548164131}, "ground_truth": 0}, {"key": "36888270", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988934990241592, "res": {"Yes": 0.9988934990241592, "No": 0.001106064786822939}, "ground_truth": 0}, {"key": "36846007", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.984669100331359, "res": {"Yes": 0.984669100331359, "No": 0.01532957975064905}, "ground_truth": 0}, {"key": "36846007", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.931583256477536, "res": {"Yes": 0.931583256477536, "No": 0.06841131801406998}, "ground_truth": 0}, {"key": "36846007", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.994702653091021, "res": {"Yes": 0.994702653091021, "No": 0.0052964605620250136}, "ground_truth": 1}, {"key": "36846007", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.986034945819449, "res": {"Yes": 0.986034945819449, "No": 0.013963883956002425}, "ground_truth": 0}, {"key": "36846007", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9900862152838269, "res": {"Yes": 0.9900862152838269, "No": 0.00991241764750195}, "ground_truth": 0}, {"key": "31723471", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7405552620775552, "res": {"Yes": 0.7405552620775552, "No": 0.25944322148208937}, "ground_truth": 0}, {"key": "31723471", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9929344104816566, "res": {"Yes": 0.9929344104816566, "No": 0.007065058377245669}, "ground_truth": 0}, {"key": "31723471", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9701147572878974, "res": {"Yes": 0.9701147572878974, "No": 0.029874428458789737}, "ground_truth": 1}, {"key": "31723471", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7142793261865749, "res": {"Yes": 0.7142793261865749, "No": 0.2857194767601189}, "ground_truth": 0}, {"key": "31723471", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.595835629132498, "res": {"Yes": 0.595835629132498, "No": 0.40416191565019544}, "ground_truth": 0}, {"key": "15921828", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0017962581200940838, "res": {"No": 0.9982035039343341, "Yes": 0.0017962581200940838}, "ground_truth": 0}, {"key": "15921828", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9900121323793065, "res": {"Yes": 0.9900121323793065, "No": 0.00998686049977331}, "ground_truth": 0}, {"key": "15921828", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9986938283856844, "res": {"Yes": 0.9986938283856844, "No": 0.0013056794791928596}, "ground_truth": 1}, {"key": "15921828", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992787725096675, "res": {"Yes": 0.9992787725096675, "No": 0.0007210330374666874}, "ground_truth": 0}, {"key": "15921828", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9974102244697384, "res": {"Yes": 0.9974102244697384, "No": 0.0025896092069565254}, "ground_truth": 0}, {"key": "39109408", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.556731963175937, "res": {"Yes": 0.556731963175937, "No": 0.4432647312276188}, "ground_truth": 0}, {"key": "39109408", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9954381447153509, "res": {"Yes": 0.9954381447153509, "No": 0.004561321020189757}, "ground_truth": 0}, {"key": "39109408", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9981018443803102, "res": {"Yes": 0.9981018443803102, "No": 0.0018979813594433095}, "ground_truth": 1}, {"key": "39109408", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9200768360323222, "res": {"Yes": 0.9200768360323222, "No": 0.07991901256587583}, "ground_truth": 0}, {"key": "39109408", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9958467919230486, "res": {"Yes": 0.9958467919230486, "No": 0.004153140433301426}, "ground_truth": 0}, {"key": "20936833", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9953105842059844, "res": {"Yes": 0.9953105842059844, "No": 0.004688844978946012}, "ground_truth": 0}, {"key": "20936833", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999180360292298, "res": {"Yes": 0.9999180360292298, "No": 8.161046962471883e-05}, "ground_truth": 0}, {"key": "20936833", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991921245472369, "res": {"Yes": 0.9991921245472369, "No": 0.0008074794113279533}, "ground_truth": 1}, {"key": "20936833", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997345272841192, "res": {"Yes": 0.9997345272841192, "No": 0.00026515765084953754}, "ground_truth": 0}, {"key": "20936833", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9642756965382372, "res": {"Yes": 0.9642756965382372, "No": 0.03572261204812472}, "ground_truth": 0}, {"key": "36832879", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.00039119144056081444, "res": {"No": 0.9996072963282799, "Yes": 0.00039119144056081444}, "ground_truth": 0}, {"key": "36832879", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.407837446258426, "res": {"No": 0.5921585494136522, "Yes": 0.407837446258426}, "ground_truth": 0}, {"key": "36832879", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9105422935383348, "res": {"Yes": 0.9105422935383348, "No": 0.08945497973310887}, "ground_truth": 1}, {"key": "36832879", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7609869117652152, "res": {"Yes": 0.7609869117652152, "No": 0.23900798919862662}, "ground_truth": 0}, {"key": "36832879", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9694107929436749, "res": {"Yes": 0.9694107929436749, "No": 0.03058762694491418}, "ground_truth": 0}, {"key": "14958201", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.2046809609841169, "res": {"No": 0.7953140109386636, "Yes": 0.2046809609841169}, "ground_truth": 0}, {"key": "14958201", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.013712181234439189, "res": {"No": 0.9862742243944962, "Yes": 0.013712181234439189}, "ground_truth": 0}, {"key": "14958201", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9504576029935837, "res": {"Yes": 0.9504576029935837, "No": 0.04953832334315601}, "ground_truth": 1}, {"key": "14958201", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9870691748865054, "res": {"Yes": 0.9870691748865054, "No": 0.012927385639883696}, "ground_truth": 0}, {"key": "14958201", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6045013352980214, "res": {"Yes": 0.6045013352980214, "No": 0.3954855217118003}, "ground_truth": 0}, {"key": "34352262", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.01920453941554696, "res": {"No": 0.9807944229910824, "Yes": 0.01920453941554696}, "ground_truth": 0}, {"key": "34352262", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.980489140381133, "res": {"Yes": 0.980489140381133, "No": 0.019510794548190873}, "ground_truth": 0}, {"key": "34352262", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997002136449121, "res": {"Yes": 0.9997002136449121, "No": 0.0002995830150553087}, "ground_truth": 1}, {"key": "34352262", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9965435961637579, "res": {"Yes": 0.9965435961637579, "No": 0.0034559219921877723}, "ground_truth": 0}, {"key": "34352262", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9778124238469249, "res": {"Yes": 0.9778124238469249, "No": 0.022187149700890838}, "ground_truth": 0}, {"key": "39805395", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9877321067652479, "res": {"Yes": 0.9877321067652479, "No": 0.01226749742382792}, "ground_truth": 0}, {"key": "39805395", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9966309689639388, "res": {"Yes": 0.9966309689639388, "No": 0.0033681858601318044}, "ground_truth": 0}, {"key": "39805395", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9946186817487399, "res": {"Yes": 0.9946186817487399, "No": 0.005380973355909158}, "ground_truth": 1}, {"key": "39805395", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9969236397236058, "res": {"Yes": 0.9969236397236058, "No": 0.0030761286635847714}, "ground_truth": 0}, {"key": "39805395", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9950468296064081, "res": {"Yes": 0.9950468296064081, "No": 0.004952684134359721}, "ground_truth": 0}, {"key": "34303109", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9938975861261286, "res": {"Yes": 0.9938975861261286, "No": 0.006102278823150138}, "ground_truth": 0}, {"key": "34303109", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9980504344764557, "res": {"Yes": 0.9980504344764557, "No": 0.0019494090570526734}, "ground_truth": 0}, {"key": "34303109", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998734658461215, "res": {"Yes": 0.9998734658461215, "No": 0.00012639558571527393}, "ground_truth": 1}, {"key": "34303109", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996182588017198, "res": {"Yes": 0.9996182588017198, "No": 0.000381660151918078}, "ground_truth": 0}, {"key": "34303109", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998311584553382, "res": {"Yes": 0.9998311584553382, "No": 0.00016872034111738724}, "ground_truth": 0}, {"key": "39939090", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.23205701110100735, "res": {"No": 0.767942391281631, "Yes": 0.23205701110100735}, "ground_truth": 0}, {"key": "39939090", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9919951597434947, "res": {"Yes": 0.9919951597434947, "No": 0.008003070487511026}, "ground_truth": 0}, {"key": "39939090", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6830448878329348, "res": {"Yes": 0.6830448878329348, "No": 0.31695182127979205}, "ground_truth": 1}, {"key": "39939090", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8918600708072825, "res": {"Yes": 0.8918600708072825, "No": 0.10813879911502594}, "ground_truth": 0}, {"key": "39939090", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.22287401997594447, "res": {"No": 0.7771089652733045, "Yes": 0.22287401997594447}, "ground_truth": 0}, {"key": "29347771", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9998451030377734, "res": {"Yes": 0.9998451030377734, "No": 0.00015481154801669597}, "ground_truth": 0}, {"key": "29347771", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9984533674707414, "res": {"Yes": 0.9984533674707414, "No": 0.001546155116132117}, "ground_truth": 0}, {"key": "29347771", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9989026493300779, "res": {"Yes": 0.9989026493300779, "No": 0.001096965003723115}, "ground_truth": 1}, {"key": "29347771", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978944296298445, "res": {"Yes": 0.9978944296298445, "No": 0.002105323798841013}, "ground_truth": 0}, {"key": "29347771", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998095901502569, "res": {"Yes": 0.9998095901502569, "No": 0.000190048738552826}, "ground_truth": 0}, {"key": "36783415", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9043903253035819, "res": {"Yes": 0.9043903253035819, "No": 0.09560426948854378}, "ground_truth": 0}, {"key": "36783415", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9740574709482446, "res": {"Yes": 0.9740574709482446, "No": 0.025936669520255407}, "ground_truth": 0}, {"key": "36783415", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9232565691774387, "res": {"Yes": 0.9232565691774387, "No": 0.07673942400425568}, "ground_truth": 1}, {"key": "36783415", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8213071110400034, "res": {"Yes": 0.8213071110400034, "No": 0.17868776962170185}, "ground_truth": 0}, {"key": "36783415", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8723513342221593, "res": {"Yes": 0.8723513342221593, "No": 0.1276239793228003}, "ground_truth": 0}, {"key": "37935687", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.06923980257447813, "res": {"No": 0.9307434440335204, "Yes": 0.06923980257447813}, "ground_truth": 0}, {"key": "37935687", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8400480889780786, "res": {"Yes": 0.8400480889780786, "No": 0.15993565514151453}, "ground_truth": 0}, {"key": "37935687", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9744258901777758, "res": {"Yes": 0.9744258901777758, "No": 0.025572296025171234}, "ground_truth": 1}, {"key": "37935687", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.549387256991123, "res": {"Yes": 0.549387256991123, "No": 0.4506053536031902}, "ground_truth": 0}, {"key": "37935687", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.49870661601255634, "res": {"No": 0.5012872444397513, "Yes": 0.49870661601255634}, "ground_truth": 0}, {"key": "40260829", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8331134263488502, "res": {"Yes": 0.8331134263488502, "No": 0.166886356201374}, "ground_truth": 0}, {"key": "40260829", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.996233870023875, "res": {"Yes": 0.996233870023875, "No": 0.0037658412617273987}, "ground_truth": 0}, {"key": "40260829", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999668403660223, "res": {"Yes": 0.999668403660223, "No": 0.0003315101932308772}, "ground_truth": 1}, {"key": "40260829", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.995992337201426, "res": {"Yes": 0.995992337201426, "No": 0.004007470639080926}, "ground_truth": 0}, {"key": "40260829", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9970261319320982, "res": {"Yes": 0.9970261319320982, "No": 0.0029736027921559026}, "ground_truth": 0}, {"key": "36478199", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8448653866965651, "res": {"Yes": 0.8448653866965651, "No": 0.1551320793618576}, "ground_truth": 0}, {"key": "36478199", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5686217378600281, "res": {"Yes": 0.5686217378600281, "No": 0.4313289952587098}, "ground_truth": 0}, {"key": "36478199", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.715477376237403, "res": {"Yes": 0.715477376237403, "No": 0.28450933898405845}, "ground_truth": 1}, {"key": "36478199", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.968680489173678, "res": {"Yes": 0.968680489173678, "No": 0.0313136398000358}, "ground_truth": 0}, {"key": "36478199", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9585120766934156, "res": {"Yes": 0.9585120766934156, "No": 0.041464800183920944}, "ground_truth": 0}, {"key": "34541803", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3875998833190554, "res": {"No": 0.612393370927507, "Yes": 0.3875998833190554}, "ground_truth": 0}, {"key": "34541803", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.017156176919202865, "res": {"No": 0.9828176437133215, "Yes": 0.017156176919202865}, "ground_truth": 0}, {"key": "34541803", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6036010937775753, "res": {"Yes": 0.6036010937775753, "No": 0.3963771071841032}, "ground_truth": 1}, {"key": "34541803", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7816160215991925, "res": {"Yes": 0.7816160215991925, "No": 0.21838157548552892}, "ground_truth": 0}, {"key": "34541803", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0038778736652008514, "res": {"No": 0.996119353246581, "Yes": 0.0038778736652008514}, "ground_truth": 0}, {"key": "35360841", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9987026306122697, "res": {"Yes": 0.9987026306122697, "No": 0.0012965829176971606}, "ground_truth": 0}, {"key": "35360841", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9830655012759869, "res": {"Yes": 0.9830655012759869, "No": 0.016931559034211032}, "ground_truth": 0}, {"key": "35360841", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993900804366019, "res": {"Yes": 0.9993900804366019, "No": 0.0006097686103834131}, "ground_truth": 1}, {"key": "35360841", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999172016779703, "res": {"Yes": 0.9999172016779703, "No": 8.240619020692956e-05}, "ground_truth": 0}, {"key": "35360841", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999468813708443, "res": {"Yes": 0.9999468813708443, "No": 5.3005069396269965e-05}, "ground_truth": 0}, {"key": "35550407", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0245054680651786, "res": {"No": 0.9754939928104528, "Yes": 0.0245054680651786}, "ground_truth": 0}, {"key": "35550407", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9975290642997403, "res": {"Yes": 0.9975290642997403, "No": 0.0024708452015808242}, "ground_truth": 0}, {"key": "35550407", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.935189145032263, "res": {"Yes": 0.935189145032263, "No": 0.0648095117584593}, "ground_truth": 1}, {"key": "35550407", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9952424497652665, "res": {"Yes": 0.9952424497652665, "No": 0.004757511221975544}, "ground_truth": 0}, {"key": "35550407", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8669778850208365, "res": {"Yes": 0.8669778850208365, "No": 0.13302029079878}, "ground_truth": 0}, {"key": "37561590", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9855784995704748, "res": {"Yes": 0.9855784995704748, "No": 0.01442076640191316}, "ground_truth": 0}, {"key": "37561590", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9901830984747232, "res": {"Yes": 0.9901830984747232, "No": 0.009816074322847111}, "ground_truth": 0}, {"key": "37561590", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.971412938231239, "res": {"Yes": 0.971412938231239, "No": 0.02858647714706431}, "ground_truth": 1}, {"key": "37561590", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978373319437346, "res": {"Yes": 0.9978373319437346, "No": 0.0021619936432215364}, "ground_truth": 0}, {"key": "37561590", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.995753280623651, "res": {"Yes": 0.995753280623651, "No": 0.004245330949784043}, "ground_truth": 0}, {"key": "39328843", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 6.5361189589399045e-06, "res": {"No": 0.9999931310055916, "Yes": 6.5361189589399045e-06}, "ground_truth": 0}, {"key": "39328843", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8469647014431306, "res": {"Yes": 0.8469647014431306, "No": 0.1530340704041006}, "ground_truth": 0}, {"key": "39328843", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9575358187603729, "res": {"Yes": 0.9575358187603729, "No": 0.042462986007131186}, "ground_truth": 1}, {"key": "39328843", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9744744460551928, "res": {"Yes": 0.9744744460551928, "No": 0.02552503356364625}, "ground_truth": 0}, {"key": "39328843", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.990691090678084, "res": {"Yes": 0.990691090678084, "No": 0.00930858673470158}, "ground_truth": 0}, {"key": "35389665", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5830685022284235, "res": {"Yes": 0.5830685022284235, "No": 0.41692447028649}, "ground_truth": 0}, {"key": "35389665", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.0079325851519332, "res": {"No": 0.9920671960874474, "Yes": 0.0079325851519332}, "ground_truth": 0}, {"key": "35389665", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9550334910060798, "res": {"Yes": 0.9550334910060798, "No": 0.04496343837538615}, "ground_truth": 1}, {"key": "35389665", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8851002655365062, "res": {"Yes": 0.8851002655365062, "No": 0.11489708090232265}, "ground_truth": 0}, {"key": "35389665", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7223353169456551, "res": {"Yes": 0.7223353169456551, "No": 0.2776618979168425}, "ground_truth": 0}, {"key": "33080187", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0003300405606487089, "res": {"No": 0.9996670928458881, "Yes": 0.0003300405606487089}, "ground_truth": 0}, {"key": "33080187", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5997700183471613, "res": {"Yes": 0.5997700183471613, "No": 0.400228558023261}, "ground_truth": 0}, {"key": "33080187", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8085796168865543, "res": {"Yes": 0.8085796168865543, "No": 0.19141889210528212}, "ground_truth": 1}, {"key": "33080187", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7592376053876507, "res": {"Yes": 0.7592376053876507, "No": 0.24076103341698388}, "ground_truth": 0}, {"key": "33080187", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9876589629724466, "res": {"Yes": 0.9876589629724466, "No": 0.012340040234696004}, "ground_truth": 0}, {"key": "38636995", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.38706464444206096, "res": {"No": 0.6129350395693676, "Yes": 0.38706464444206096}, "ground_truth": 0}, {"key": "38636995", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9981084961524069, "res": {"Yes": 0.9981084961524069, "No": 0.0018910992598823169}, "ground_truth": 0}, {"key": "38636995", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994199717814423, "res": {"Yes": 0.9994199717814423, "No": 0.0005798970327067735}, "ground_truth": 1}, {"key": "38636995", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997980296587561, "res": {"Yes": 0.9997980296587561, "No": 0.00020178556173556844}, "ground_truth": 0}, {"key": "38636995", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9934533396696285, "res": {"Yes": 0.9934533396696285, "No": 0.006546462182919546}, "ground_truth": 0}, {"key": "18536236", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9926101197364294, "res": {"Yes": 0.9926101197364294, "No": 0.007388725660209693}, "ground_truth": 0}, {"key": "18536236", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9468721350298784, "res": {"Yes": 0.9468721350298784, "No": 0.053127053413241414}, "ground_truth": 0}, {"key": "18536236", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9851942274697765, "res": {"Yes": 0.9851942274697765, "No": 0.01480423485930255}, "ground_truth": 1}, {"key": "18536236", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9794792569539347, "res": {"Yes": 0.9794792569539347, "No": 0.020520025828121}, "ground_truth": 0}, {"key": "18536236", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992993654590848, "res": {"Yes": 0.9992993654590848, "No": 0.0006999494078729563}, "ground_truth": 0}, {"key": "36289151", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9937844248053819, "res": {"Yes": 0.9937844248053819, "No": 0.006215260749700673}, "ground_truth": 0}, {"key": "36289151", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9877567697561255, "res": {"Yes": 0.9877567697561255, "No": 0.012235884403303466}, "ground_truth": 0}, {"key": "36289151", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9787830154358151, "res": {"Yes": 0.9787830154358151, "No": 0.021213977468598346}, "ground_truth": 1}, {"key": "36289151", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9960790311512863, "res": {"Yes": 0.9960790311512863, "No": 0.003920329000510203}, "ground_truth": 0}, {"key": "36289151", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 1.298228918185342e-05, "res": {"No": 0.9999868132749457, "Yes": 1.298228918185342e-05}, "ground_truth": 0}, {"key": "23017045", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9992143868257488, "res": {"Yes": 0.9992143868257488, "No": 0.0007855040062712004}, "ground_truth": 0}, {"key": "23017045", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9988794633705462, "res": {"Yes": 0.9988794633705462, "No": 0.0011203860114208767}, "ground_truth": 0}, {"key": "23017045", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.17293674278357177, "res": {"No": 0.8270611869970348, "Yes": 0.17293674278357177}, "ground_truth": 1}, {"key": "23017045", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9974835140728082, "res": {"Yes": 0.9974835140728082, "No": 0.00251631285925224}, "ground_truth": 0}, {"key": "23017045", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 1.996124514513277e-06, "res": {"No": 0.9999974223173222, "Yes": 1.996124514513277e-06}, "ground_truth": 0}, {"key": "36418082", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9104724212037645, "res": {"Yes": 0.9104724212037645, "No": 0.08952594566631086}, "ground_truth": 0}, {"key": "36418082", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9410160059784743, "res": {"Yes": 0.9410160059784743, "No": 0.058980322951477676}, "ground_truth": 0}, {"key": "36418082", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9836832619590747, "res": {"Yes": 0.9836832619590747, "No": 0.01631516884377843}, "ground_truth": 1}, {"key": "36418082", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9619835608268685, "res": {"Yes": 0.9619835608268685, "No": 0.03801567136229874}, "ground_truth": 0}, {"key": "36418082", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7325377526244358, "res": {"Yes": 0.7325377526244358, "No": 0.267456778874913}, "ground_truth": 0}, {"key": "34396551", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8148139777119964, "res": {"Yes": 0.8148139777119964, "No": 0.18518480621709676}, "ground_truth": 0}, {"key": "34396551", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7744107201087089, "res": {"Yes": 0.7744107201087089, "No": 0.2255865680310954}, "ground_truth": 0}, {"key": "34396551", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9435489011489453, "res": {"Yes": 0.9435489011489453, "No": 0.05644510534163095}, "ground_truth": 1}, {"key": "34396551", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9660076592218161, "res": {"Yes": 0.9660076592218161, "No": 0.03399085367888722}, "ground_truth": 0}, {"key": "34396551", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9394385475567173, "res": {"Yes": 0.9394385475567173, "No": 0.060559659039254095}, "ground_truth": 0}, {"key": "39720944", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8936078111947174, "res": {"Yes": 0.8936078111947174, "No": 0.10638844580812866}, "ground_truth": 0}, {"key": "39720944", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.994498760543598, "res": {"Yes": 0.994498760543598, "No": 0.005499810730347128}, "ground_truth": 0}, {"key": "39720944", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9432589421822882, "res": {"Yes": 0.9432589421822882, "No": 0.05673944676508237}, "ground_truth": 1}, {"key": "39720944", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9129727732734594, "res": {"Yes": 0.9129727732734594, "No": 0.08702442087532228}, "ground_truth": 0}, {"key": "39720944", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994587883678789, "res": {"Yes": 0.9994587883678789, "No": 0.0005405899039145907}, "ground_truth": 0}, {"key": "35884842", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.685652664123122, "res": {"Yes": 0.685652664123122, "No": 0.31434367036024313}, "ground_truth": 0}, {"key": "35884842", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7853114957777481, "res": {"Yes": 0.7853114957777481, "No": 0.21468649023377373}, "ground_truth": 0}, {"key": "35884842", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9628545538639948, "res": {"Yes": 0.9628545538639948, "No": 0.03714413476850169}, "ground_truth": 1}, {"key": "35884842", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9691179384411882, "res": {"Yes": 0.9691179384411882, "No": 0.030881178212609866}, "ground_truth": 0}, {"key": "35884842", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.460494116361147, "res": {"No": 0.5394926220016396, "Yes": 0.460494116361147}, "ground_truth": 0}, {"key": "35403375", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9834710679730595, "res": {"Yes": 0.9834710679730595, "No": 0.016526667344974003}, "ground_truth": 0}, {"key": "35403375", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9955004028569171, "res": {"Yes": 0.9955004028569171, "No": 0.004499304723644053}, "ground_truth": 0}, {"key": "35403375", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7094022747959187, "res": {"Yes": 0.7094022747959187, "No": 0.2905966371514921}, "ground_truth": 1}, {"key": "35403375", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9979601924408615, "res": {"Yes": 0.9979601924408615, "No": 0.0020396407287370144}, "ground_truth": 0}, {"key": "35403375", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9987375876137813, "res": {"Yes": 0.9987375876137813, "No": 0.0012618466950695757}, "ground_truth": 0}, {"key": "26341324", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5980727660956588, "res": {"Yes": 0.5980727660956588, "No": 0.4019255003700531}, "ground_truth": 0}, {"key": "26341324", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9946101889349994, "res": {"Yes": 0.9946101889349994, "No": 0.005389555311335017}, "ground_truth": 0}, {"key": "26341324", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997172511609895, "res": {"Yes": 0.9997172511609895, "No": 0.0002816946148156586}, "ground_truth": 1}, {"key": "26341324", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996482724706356, "res": {"Yes": 0.9996482724706356, "No": 0.0003508755344820588}, "ground_truth": 0}, {"key": "26341324", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995220166204699, "res": {"Yes": 0.9995220166204699, "No": 0.00047736474247603154}, "ground_truth": 0}, {"key": "19212345", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7247559003444926, "res": {"Yes": 0.7247559003444926, "No": 0.27524375282606056}, "ground_truth": 0}, {"key": "19212345", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9666850418944691, "res": {"Yes": 0.9666850418944691, "No": 0.033314691270247325}, "ground_truth": 0}, {"key": "19212345", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9920470116936123, "res": {"Yes": 0.9920470116936123, "No": 0.007951632702643641}, "ground_truth": 1}, {"key": "19212345", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9874257518831967, "res": {"Yes": 0.9874257518831967, "No": 0.01257388292429847}, "ground_truth": 0}, {"key": "19212345", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9037441486978478, "res": {"Yes": 0.9037441486978478, "No": 0.0962551500723991}, "ground_truth": 0}, {"key": "30548367", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9898567483101313, "res": {"Yes": 0.9898567483101313, "No": 0.010142304889424334}, "ground_truth": 0}, {"key": "30548367", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9553505134975651, "res": {"Yes": 0.9553505134975651, "No": 0.04464673047431487}, "ground_truth": 0}, {"key": "30548367", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9617390499131924, "res": {"Yes": 0.9617390499131924, "No": 0.03825881835700099}, "ground_truth": 1}, {"key": "30548367", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9754426119685728, "res": {"Yes": 0.9754426119685728, "No": 0.024556580889287638}, "ground_truth": 0}, {"key": "30548367", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8843522967495475, "res": {"Yes": 0.8843522967495475, "No": 0.115642574387138}, "ground_truth": 0}, {"key": "37919402", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8203549553565703, "res": {"Yes": 0.8203549553565703, "No": 0.1796431851824312}, "ground_truth": 0}, {"key": "37919402", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9887111853045265, "res": {"Yes": 0.9887111853045265, "No": 0.011284795390277044}, "ground_truth": 0}, {"key": "37919402", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999561788061766, "res": {"Yes": 0.9999561788061766, "No": 4.270438285597734e-05}, "ground_truth": 1}, {"key": "37919402", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996734085725947, "res": {"Yes": 0.9996734085725947, "No": 0.00032612428725699896}, "ground_truth": 0}, {"key": "37919402", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9950700874062752, "res": {"Yes": 0.9950700874062752, "No": 0.004928468442219535}, "ground_truth": 0}, {"key": "39995133", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9986699329243272, "res": {"Yes": 0.9986699329243272, "No": 0.0013298062819846112}, "ground_truth": 0}, {"key": "39995133", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9965215780752061, "res": {"Yes": 0.9965215780752061, "No": 0.003478224209714601}, "ground_truth": 0}, {"key": "39995133", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992794872940292, "res": {"Yes": 0.9992794872940292, "No": 0.0007204917449363357}, "ground_truth": 1}, {"key": "39995133", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9920189718811013, "res": {"Yes": 0.9920189718811013, "No": 0.007980579109824975}, "ground_truth": 0}, {"key": "39995133", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9936950660381763, "res": {"Yes": 0.9936950660381763, "No": 0.0063043166353446934}, "ground_truth": 0}, {"key": "40249088", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9965850355004456, "res": {"Yes": 0.9965850355004456, "No": 0.003414746568455501}, "ground_truth": 0}, {"key": "40249088", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998566603941031, "res": {"Yes": 0.9998566603941031, "No": 0.00014261141558463214}, "ground_truth": 0}, {"key": "40249088", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991827261203712, "res": {"Yes": 0.9991827261203712, "No": 0.0008168154304075152}, "ground_truth": 1}, {"key": "40249088", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990156687721268, "res": {"Yes": 0.9990156687721268, "No": 0.000981393556451487}, "ground_truth": 0}, {"key": "40249088", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9046316090297086, "res": {"Yes": 0.9046316090297086, "No": 0.09536782705662475}, "ground_truth": 0}, {"key": "40254388", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9991832025607841, "res": {"Yes": 0.9991832025607841, "No": 0.0008165198783866149}, "ground_truth": 0}, {"key": "40254388", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9830254097331805, "res": {"Yes": 0.9830254097331805, "No": 0.01697457911921476}, "ground_truth": 0}, {"key": "40254388", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999305514716607, "res": {"Yes": 0.9999305514716607, "No": 6.919748776317627e-05}, "ground_truth": 1}, {"key": "40254388", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999621387467553, "res": {"Yes": 0.9999621387467553, "No": 3.777379310068211e-05}, "ground_truth": 0}, {"key": "40254388", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9978166759269269, "res": {"Yes": 0.9978166759269269, "No": 0.002182831481992243}, "ground_truth": 0}, {"key": "31995230", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8523259030297596, "res": {"Yes": 0.8523259030297596, "No": 0.14767142125623087}, "ground_truth": 0}, {"key": "31995230", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9917485189094549, "res": {"Yes": 0.9917485189094549, "No": 0.008249588159023186}, "ground_truth": 0}, {"key": "31995230", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994964224377642, "res": {"Yes": 0.9994964224377642, "No": 0.0005030686077743887}, "ground_truth": 1}, {"key": "31995230", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992085504615368, "res": {"Yes": 0.9992085504615368, "No": 0.00079103843577932}, "ground_truth": 0}, {"key": "31995230", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9477386532122647, "res": {"Yes": 0.9477386532122647, "No": 0.052236541513776845}, "ground_truth": 0}, {"key": "38632129", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9303375701869687, "res": {"Yes": 0.9303375701869687, "No": 0.06966043287166962}, "ground_truth": 0}, {"key": "38632129", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9821052923728187, "res": {"Yes": 0.9821052923728187, "No": 0.017893508241285692}, "ground_truth": 0}, {"key": "38632129", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9848773040353086, "res": {"Yes": 0.9848773040353086, "No": 0.015121445665556609}, "ground_truth": 1}, {"key": "38632129", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8215673998609602, "res": {"Yes": 0.8215673998609602, "No": 0.17842761111285982}, "ground_truth": 0}, {"key": "38632129", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8111831970950282, "res": {"Yes": 0.8111831970950282, "No": 0.18881295689569524}, "ground_truth": 0}, {"key": "35720795", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9975364186098766, "res": {"Yes": 0.9975364186098766, "No": 0.0024631745339787742}, "ground_truth": 0}, {"key": "35720795", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7521697643836022, "res": {"Yes": 0.7521697643836022, "No": 0.24782741062115568}, "ground_truth": 0}, {"key": "35720795", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9704695125834444, "res": {"Yes": 0.9704695125834444, "No": 0.02952388742739717}, "ground_truth": 1}, {"key": "35720795", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8635115376420105, "res": {"Yes": 0.8635115376420105, "No": 0.13648253790178344}, "ground_truth": 0}, {"key": "35720795", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9933559386296685, "res": {"Yes": 0.9933559386296685, "No": 0.006641320930251184}, "ground_truth": 0}, {"key": "23906759", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.006753524920214174, "res": {"No": 0.9932457283264242, "Yes": 0.006753524920214174}, "ground_truth": 0}, {"key": "23906759", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6626782305883141, "res": {"Yes": 0.6626782305883141, "No": 0.33732089196825715}, "ground_truth": 0}, {"key": "23906759", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.028799337372621775, "res": {"No": 0.9711971142552956, "Yes": 0.028799337372621775}, "ground_truth": 1}, {"key": "23906759", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.009351212172191101, "res": {"No": 0.9906479212636986, "Yes": 0.009351212172191101}, "ground_truth": 0}, {"key": "23906759", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.004074370592691746, "res": {"No": 0.9959239939545559, "Yes": 0.004074370592691746}, "ground_truth": 0}, {"key": "19410108", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.23379540118617634, "res": {"No": 0.7661996910035462, "Yes": 0.23379540118617634}, "ground_truth": 0}, {"key": "19410108", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9951779791519073, "res": {"Yes": 0.9951779791519073, "No": 0.004821954187471693}, "ground_truth": 0}, {"key": "19410108", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997671662999741, "res": {"Yes": 0.9997671662999741, "No": 0.000232612169457158}, "ground_truth": 1}, {"key": "19410108", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999597547668612, "res": {"Yes": 0.9999597547668612, "No": 4.014261779924514e-05}, "ground_truth": 0}, {"key": "19410108", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996151606896513, "res": {"Yes": 0.9996151606896513, "No": 0.00038462604784380276}, "ground_truth": 0}, {"key": "30745137", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.005141634263259412, "res": {"No": 0.9948573104402166, "Yes": 0.005141634263259412}, "ground_truth": 0}, {"key": "30745137", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.38336769928599834, "res": {"No": 0.6166267631974561, "Yes": 0.38336769928599834}, "ground_truth": 0}, {"key": "30745137", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.873584488488683, "res": {"Yes": 0.873584488488683, "No": 0.1264089490916315}, "ground_truth": 1}, {"key": "30745137", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9482272786974696, "res": {"Yes": 0.9482272786974696, "No": 0.05177058231577225}, "ground_truth": 0}, {"key": "30745137", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9476566441962853, "res": {"Yes": 0.9476566441962853, "No": 0.05234253236886626}, "ground_truth": 0}, {"key": "26553115", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.18490707082011212, "res": {"No": 0.8150923657127461, "Yes": 0.18490707082011212}, "ground_truth": 0}, {"key": "26553115", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9958378026537995, "res": {"Yes": 0.9958378026537995, "No": 0.004161841226935043}, "ground_truth": 0}, {"key": "26553115", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9989510693127934, "res": {"Yes": 0.9989510693127934, "No": 0.0010487649974240056}, "ground_truth": 1}, {"key": "26553115", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9977146166741402, "res": {"Yes": 0.9977146166741402, "No": 0.002285174248486733}, "ground_truth": 0}, {"key": "26553115", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997221371310395, "res": {"Yes": 0.9997221371310395, "No": 0.0002777300386705442}, "ground_truth": 0}, {"key": "37872311", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.25055064581260017, "res": {"No": 0.7494484372526354, "Yes": 0.25055064581260017}, "ground_truth": 0}, {"key": "37872311", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8531702002792517, "res": {"Yes": 0.8531702002792517, "No": 0.1468229999008602}, "ground_truth": 0}, {"key": "37872311", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993398450981942, "res": {"Yes": 0.9993398450981942, "No": 0.000659603276425254}, "ground_truth": 1}, {"key": "37872311", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9947755541377793, "res": {"Yes": 0.9947755541377793, "No": 0.0052210591258297695}, "ground_truth": 0}, {"key": "37872311", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994057985076705, "res": {"Yes": 0.9994057985076705, "No": 0.0005926357483841929}, "ground_truth": 0}, {"key": "35553131", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.998166453004852, "res": {"Yes": 0.998166453004852, "No": 0.0018333794888359962}, "ground_truth": 0}, {"key": "35553131", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997129610535632, "res": {"Yes": 0.9997129610535632, "No": 0.00028700067221352246}, "ground_truth": 0}, {"key": "35553131", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993141291170383, "res": {"Yes": 0.9993141291170383, "No": 0.0006857617457270955}, "ground_truth": 1}, {"key": "35553131", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997129610535632, "res": {"Yes": 0.9997129610535632, "No": 0.0002868945016075767}, "ground_truth": 0}, {"key": "35553131", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9959335697102003, "res": {"Yes": 0.9959335697102003, "No": 0.004065156651786654}, "ground_truth": 0}, {"key": "39038936", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9823862677052662, "res": {"Yes": 0.9823862677052662, "No": 0.017613271475346994}, "ground_truth": 0}, {"key": "39038936", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9517575814037587, "res": {"Yes": 0.9517575814037587, "No": 0.04824098056337482}, "ground_truth": 0}, {"key": "39038936", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998346147876424, "res": {"Yes": 0.9998346147876424, "No": 0.00016508435042375202}, "ground_truth": 1}, {"key": "39038936", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992237856103722, "res": {"Yes": 0.9992237856103722, "No": 0.0007759837334885906}, "ground_truth": 0}, {"key": "39038936", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997907597337986, "res": {"Yes": 0.9997907597337986, "No": 0.00020819841805731496}, "ground_truth": 0}, {"key": "38735486", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.03282407627788671, "res": {"No": 0.967170987995928, "Yes": 0.03282407627788671}, "ground_truth": 0}, {"key": "38735486", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9912784453509222, "res": {"Yes": 0.9912784453509222, "No": 0.008721003215758484}, "ground_truth": 0}, {"key": "38735486", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988274861321778, "res": {"Yes": 0.9988274861321778, "No": 0.001172253868425027}, "ground_truth": 1}, {"key": "38735486", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998143049869289, "res": {"Yes": 0.998143049869289, "No": 0.0018557970475084216}, "ground_truth": 0}, {"key": "38735486", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990476631608393, "res": {"Yes": 0.9990476631608393, "No": 0.0009518104025429462}, "ground_truth": 0}, {"key": "17087845", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0009129243860694919, "res": {"No": 0.9990865698315521, "Yes": 0.0009129243860694919}, "ground_truth": 0}, {"key": "17087845", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5942240750673556, "res": {"Yes": 0.5942240750673556, "No": 0.40577474038158723}, "ground_truth": 0}, {"key": "17087845", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9231528286655301, "res": {"Yes": 0.9231528286655301, "No": 0.07684532835345884}, "ground_truth": 1}, {"key": "17087845", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9925901542794943, "res": {"Yes": 0.9925901542794943, "No": 0.007409576454090512}, "ground_truth": 0}, {"key": "17087845", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8814904156297279, "res": {"Yes": 0.8814904156297279, "No": 0.11850800120133487}, "ground_truth": 0}, {"key": "37443011", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8285761029727639, "res": {"Yes": 0.8285761029727639, "No": 0.17142130168466643}, "ground_truth": 0}, {"key": "37443011", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994242570036421, "res": {"Yes": 0.9994242570036421, "No": 0.0005751057620964154}, "ground_truth": 0}, {"key": "37443011", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6615181421688215, "res": {"Yes": 0.6615181421688215, "No": 0.3384792799083696}, "ground_truth": 1}, {"key": "37443011", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989555905755648, "res": {"Yes": 0.9989555905755648, "No": 0.001044059289944152}, "ground_truth": 0}, {"key": "37443011", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8140245367551954, "res": {"Yes": 0.8140245367551954, "No": 0.18597407438701097}, "ground_truth": 0}, {"key": "36855749", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9984657237071558, "res": {"Yes": 0.9984657237071558, "No": 0.001533428194638863}, "ground_truth": 0}, {"key": "36855749", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9780938063829832, "res": {"Yes": 0.9780938063829832, "No": 0.021899015445428927}, "ground_truth": 0}, {"key": "36855749", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9849137264563538, "res": {"Yes": 0.9849137264563538, "No": 0.015080185732490873}, "ground_truth": 1}, {"key": "36855749", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9822291426766173, "res": {"Yes": 0.9822291426766173, "No": 0.017763412759441405}, "ground_truth": 0}, {"key": "36855749", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9690256895880663, "res": {"Yes": 0.9690256895880663, "No": 0.03096966196420272}, "ground_truth": 0}, {"key": "35613141", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996124200785106, "res": {"Yes": 0.9996124200785106, "No": 0.0003870831616635913}, "ground_truth": 0}, {"key": "35613141", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9980040056513704, "res": {"Yes": 0.9980040056513704, "No": 0.001995453971281194}, "ground_truth": 0}, {"key": "35613141", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9863316232794357, "res": {"Yes": 0.9863316232794357, "No": 0.01366806758472432}, "ground_truth": 1}, {"key": "35613141", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.921353085791755, "res": {"Yes": 0.921353085791755, "No": 0.07864618945874503}, "ground_truth": 0}, {"key": "35613141", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985222949828305, "res": {"Yes": 0.9985222949828305, "No": 0.0014775715255618566}, "ground_truth": 0}, {"key": "39088847", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8950677099441374, "res": {"Yes": 0.8950677099441374, "No": 0.10493218443578398}, "ground_truth": 0}, {"key": "39088847", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9977268410478263, "res": {"Yes": 0.9977268410478263, "No": 0.002272717561185083}, "ground_truth": 0}, {"key": "39088847", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994968953496083, "res": {"Yes": 0.9994968953496083, "No": 0.00050302484270932}, "ground_truth": 1}, {"key": "39088847", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998967005557551, "res": {"Yes": 0.9998967005557551, "No": 0.00010321823755870062}, "ground_truth": 0}, {"key": "39088847", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993959178311462, "res": {"Yes": 0.9993959178311462, "No": 0.0006038900578650286}, "ground_truth": 0}, {"key": "33197277", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8103935865584043, "res": {"Yes": 0.8103935865584043, "No": 0.18960236795975335}, "ground_truth": 0}, {"key": "33197277", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9841471740401064, "res": {"Yes": 0.9841471740401064, "No": 0.015848871181941185}, "ground_truth": 0}, {"key": "33197277", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991460786685078, "res": {"Yes": 0.9991460786685078, "No": 0.000853456912762989}, "ground_truth": 1}, {"key": "33197277", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9900217127730663, "res": {"Yes": 0.9900217127730663, "No": 0.009977587014569845}, "ground_truth": 0}, {"key": "33197277", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9421530539028081, "res": {"Yes": 0.9421530539028081, "No": 0.05783547137074893}, "ground_truth": 0}, {"key": "33815489", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9973007754751656, "res": {"Yes": 0.9973007754751656, "No": 0.0026991464110809765}, "ground_truth": 0}, {"key": "33815489", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9966946780435862, "res": {"Yes": 0.9966946780435862, "No": 0.003304990103782218}, "ground_truth": 0}, {"key": "33815489", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996798398322082, "res": {"Yes": 0.9996798398322082, "No": 0.00032001522025651224}, "ground_truth": 1}, {"key": "33815489", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993828244812086, "res": {"Yes": 0.9993828244812086, "No": 0.0006170904181388398}, "ground_truth": 0}, {"key": "33815489", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9867152901391018, "res": {"Yes": 0.9867152901391018, "No": 0.013284172367230356}, "ground_truth": 0}, {"key": "35862754", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9622510554139703, "res": {"Yes": 0.9622510554139703, "No": 0.037748603399923114}, "ground_truth": 0}, {"key": "35862754", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9925973277544606, "res": {"Yes": 0.9925973277544606, "No": 0.007401830089174672}, "ground_truth": 0}, {"key": "35862754", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9956401717657793, "res": {"Yes": 0.9956401717657793, "No": 0.004359259829102693}, "ground_truth": 1}, {"key": "35862754", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9810146458671821, "res": {"Yes": 0.9810146458671821, "No": 0.018982021208103817}, "ground_truth": 0}, {"key": "35862754", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9401039111979498, "res": {"Yes": 0.9401039111979498, "No": 0.05989513475185326}, "ground_truth": 0}, {"key": "36080615", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0017585343017238863, "res": {"No": 0.9982414000522081, "Yes": 0.0017585343017238863}, "ground_truth": 0}, {"key": "36080615", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9727904255260013, "res": {"Yes": 0.9727904255260013, "No": 0.02720906742552932}, "ground_truth": 0}, {"key": "36080615", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996828189725412, "res": {"Yes": 0.9996828189725412, "No": 0.00031701261180645}, "ground_truth": 1}, {"key": "36080615", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.995055567150981, "res": {"Yes": 0.995055567150981, "No": 0.004944213381844061}, "ground_truth": 0}, {"key": "36080615", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.997545790508554, "res": {"Yes": 0.997545790508554, "No": 0.002453763526024008}, "ground_truth": 0}, {"key": "22822742", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9766485913114847, "res": {"Yes": 0.9766485913114847, "No": 0.023350485565198458}, "ground_truth": 0}, {"key": "22822742", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9269249053037045, "res": {"Yes": 0.9269249053037045, "No": 0.07307110286691315}, "ground_truth": 0}, {"key": "22822742", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993378199980104, "res": {"Yes": 0.9993378199980104, "No": 0.0006606495765922249}, "ground_truth": 1}, {"key": "22822742", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997296412535144, "res": {"Yes": 0.9997296412535144, "No": 0.0002696577488225524}, "ground_truth": 0}, {"key": "22822742", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6006924775567024, "res": {"Yes": 0.6006924775567024, "No": 0.39927832854586087}, "ground_truth": 0}, {"key": "39747536", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9527355309130062, "res": {"Yes": 0.9527355309130062, "No": 0.0472621365416699}, "ground_truth": 0}, {"key": "39747536", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.383772350281815, "res": {"No": 0.6162212240309244, "Yes": 0.383772350281815}, "ground_truth": 0}, {"key": "39747536", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6750550337173519, "res": {"Yes": 0.6750550337173519, "No": 0.32493572026961237}, "ground_truth": 1}, {"key": "39747536", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5058920613197486, "res": {"Yes": 0.5058920613197486, "No": 0.49409391427222543}, "ground_truth": 0}, {"key": "39747536", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.2404008597491261, "res": {"No": 0.7595753590091057, "Yes": 0.2404008597491261}, "ground_truth": 0}, {"key": "34218396", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9655086577869675, "res": {"Yes": 0.9655086577869675, "No": 0.034490664009023286}, "ground_truth": 0}, {"key": "34218396", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9690362161713073, "res": {"Yes": 0.9690362161713073, "No": 0.03096219917497157}, "ground_truth": 0}, {"key": "34218396", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9585339856543382, "res": {"Yes": 0.9585339856543382, "No": 0.04146416577733134}, "ground_truth": 1}, {"key": "34218396", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9971543694041133, "res": {"Yes": 0.9971543694041133, "No": 0.002844842708292193}, "ground_truth": 0}, {"key": "34218396", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9978489633023848, "res": {"Yes": 0.9978489633023848, "No": 0.0021506503375495764}, "ground_truth": 0}, {"key": "39150388", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.13794006496685743, "res": {"No": 0.8620587975757178, "Yes": 0.13794006496685743}, "ground_truth": 0}, {"key": "39150388", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999661915245194, "res": {"Yes": 0.9999661915245194, "No": 3.3725915844166326e-05}, "ground_truth": 0}, {"key": "39150388", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999973031140366, "res": {"Yes": 0.9999973031140366, "No": 2.1805923453968426e-06}, "ground_truth": 1}, {"key": "39150388", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999928926002577, "res": {"Yes": 0.9999928926002577, "No": 6.745479372748131e-06}, "ground_truth": 0}, {"key": "39150388", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7042089449891371, "res": {"Yes": 0.7042089449891371, "No": 0.2957904247260513}, "ground_truth": 0}, {"key": "28765782", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9998695326316075, "res": {"Yes": 0.9998695326316075, "No": 0.0001298760531015361}, "ground_truth": 0}, {"key": "28765782", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9877342007595339, "res": {"Yes": 0.9877342007595339, "No": 0.01226546609445324}, "ground_truth": 0}, {"key": "28765782", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9979723045576262, "res": {"Yes": 0.9979723045576262, "No": 0.0020276637717927125}, "ground_truth": 1}, {"key": "28765782", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993697276051425, "res": {"Yes": 0.9993697276051425, "No": 0.000630231087676371}, "ground_truth": 0}, {"key": "28765782", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9981789208804327, "res": {"Yes": 0.9981789208804327, "No": 0.0018208981693162713}, "ground_truth": 0}, {"key": "35828022", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9974233851849945, "res": {"Yes": 0.9974233851849945, "No": 0.002576026199959553}, "ground_truth": 0}, {"key": "35828022", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9638087173944403, "res": {"Yes": 0.9638087173944403, "No": 0.03618813414260163}, "ground_truth": 0}, {"key": "35828022", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.22497304139015234, "res": {"No": 0.7750256758876263, "Yes": 0.22497304139015234}, "ground_truth": 1}, {"key": "35828022", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9921658769586713, "res": {"Yes": 0.9921658769586713, "No": 0.007833684638795064}, "ground_truth": 0}, {"key": "35828022", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5717989873968033, "res": {"Yes": 0.5717989873968033, "No": 0.4282004722305911}, "ground_truth": 0}, {"key": "27717735", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9975003583201376, "res": {"Yes": 0.9975003583201376, "No": 0.002499573904085628}, "ground_truth": 0}, {"key": "27717735", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989108581459988, "res": {"Yes": 0.9989108581459988, "No": 0.0010890647266725978}, "ground_truth": 0}, {"key": "27717735", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9981587298216172, "res": {"Yes": 0.9981587298216172, "No": 0.001841264527864926}, "ground_truth": 1}, {"key": "27717735", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9926083697663309, "res": {"Yes": 0.9926083697663309, "No": 0.007391445211619418}, "ground_truth": 0}, {"key": "27717735", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9908395865867602, "res": {"Yes": 0.9908395865867602, "No": 0.009160335264847618}, "ground_truth": 0}, {"key": "37977826", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.11392895803198656, "res": {"No": 0.8860692953317741, "Yes": 0.11392895803198656}, "ground_truth": 0}, {"key": "37977826", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7393439056833155, "res": {"Yes": 0.7393439056833155, "No": 0.26061055823821516}, "ground_truth": 0}, {"key": "37977826", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9664470472382161, "res": {"Yes": 0.9664470472382161, "No": 0.033548393515650275}, "ground_truth": 1}, {"key": "37977826", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9942620641976373, "res": {"Yes": 0.9942620641976373, "No": 0.005737199957224679}, "ground_truth": 0}, {"key": "37977826", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9960401176934734, "res": {"Yes": 0.9960401176934734, "No": 0.00395912990031845}, "ground_truth": 0}, {"key": "31768588", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9990904999461218, "res": {"Yes": 0.9990904999461218, "No": 0.0009089871502730201}, "ground_truth": 0}, {"key": "31768588", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990399260661719, "res": {"Yes": 0.9990399260661719, "No": 0.0009597075071297236}, "ground_truth": 0}, {"key": "31768588", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9828520694698398, "res": {"Yes": 0.9828520694698398, "No": 0.017146309809167586}, "ground_truth": 1}, {"key": "31768588", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9970943830996432, "res": {"Yes": 0.9970943830996432, "No": 0.0029011542614194655}, "ground_truth": 0}, {"key": "31768588", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.951396086884583, "res": {"Yes": 0.951396086884583, "No": 0.04860180543001239}, "ground_truth": 0}, {"key": "37183351", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9997154636081595, "res": {"Yes": 0.9997154636081595, "No": 0.00028447931885292277}, "ground_truth": 0}, {"key": "37183351", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999306706693891, "res": {"Yes": 0.9999306706693891, "No": 6.919700338245726e-05}, "ground_truth": 0}, {"key": "37183351", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992164080686312, "res": {"Yes": 0.9992164080686312, "No": 0.0007833120578927008}, "ground_truth": 1}, {"key": "37183351", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993253229669699, "res": {"Yes": 0.9993253229669699, "No": 0.0006744425905657681}, "ground_truth": 0}, {"key": "37183351", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996720977516971, "res": {"Yes": 0.9996720977516971, "No": 0.0003277993088850884}, "ground_truth": 0}, {"key": "39622090", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.03385019225581339, "res": {"No": 0.9661474013702522, "Yes": 0.03385019225581339}, "ground_truth": 0}, {"key": "39622090", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 9.053790094103047e-05, "res": {"No": 0.9999083813732428, "Yes": 9.053790094103047e-05}, "ground_truth": 0}, {"key": "39622090", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.17739111409807437, "res": {"No": 0.8226078173577949, "Yes": 0.17739111409807437}, "ground_truth": 1}, {"key": "39622090", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.018308094399783467, "res": {"No": 0.9816913073634558, "Yes": 0.018308094399783467}, "ground_truth": 0}, {"key": "39622090", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.00039936371095952516, "res": {"No": 0.9995993201936023, "Yes": 0.00039936371095952516}, "ground_truth": 0}, {"key": "39272756", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3925617418712885, "res": {"No": 0.6074365825990423, "Yes": 0.3925617418712885}, "ground_truth": 0}, {"key": "39272756", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9959950572602131, "res": {"Yes": 0.9959950572602131, "No": 0.004004303184464811}, "ground_truth": 0}, {"key": "39272756", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9810048877630317, "res": {"Yes": 0.9810048877630317, "No": 0.01899349361078159}, "ground_truth": 1}, {"key": "39272756", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9513312371805857, "res": {"Yes": 0.9513312371805857, "No": 0.048666951170004566}, "ground_truth": 0}, {"key": "39272756", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9953376267637991, "res": {"Yes": 0.9953376267637991, "No": 0.004659801165977824}, "ground_truth": 0}, {"key": "32138822", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7402099032243139, "res": {"Yes": 0.7402099032243139, "No": 0.25978754931727016}, "ground_truth": 0}, {"key": "32138822", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991356014078913, "res": {"Yes": 0.9991356014078913, "No": 0.0008637222592851464}, "ground_truth": 0}, {"key": "32138822", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997397708854714, "res": {"Yes": 0.9997397708854714, "No": 0.0002597468643130145}, "ground_truth": 1}, {"key": "32138822", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9984923443563763, "res": {"Yes": 0.9984923443563763, "No": 0.001507203246726584}, "ground_truth": 0}, {"key": "32138822", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9987554238281279, "res": {"Yes": 0.9987554238281279, "No": 0.0012442832719705642}, "ground_truth": 0}, {"key": "31070114", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7715102588417446, "res": {"Yes": 0.7715102588417446, "No": 0.22848728858961978}, "ground_truth": 0}, {"key": "31070114", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.998673976846674, "res": {"Yes": 0.998673976846674, "No": 0.001325809583125162}, "ground_truth": 0}, {"key": "31070114", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9965640743485178, "res": {"Yes": 0.9965640743485178, "No": 0.003434753902428522}, "ground_truth": 1}, {"key": "31070114", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995523885079278, "res": {"Yes": 0.9995523885079278, "No": 0.0004474310993663778}, "ground_truth": 0}, {"key": "31070114", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994323545216897, "res": {"Yes": 0.9994323545216897, "No": 0.000567379026781129}, "ground_truth": 0}, {"key": "39652762", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9591532020315037, "res": {"Yes": 0.9591532020315037, "No": 0.04084536205937597}, "ground_truth": 0}, {"key": "39652762", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9970364463204873, "res": {"Yes": 0.9970364463204873, "No": 0.0029608215455011965}, "ground_truth": 0}, {"key": "39652762", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.974856317997655, "res": {"Yes": 0.974856317997655, "No": 0.02513790280359536}, "ground_truth": 1}, {"key": "39652762", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6953020107251001, "res": {"Yes": 0.6953020107251001, "No": 0.30469612819879693}, "ground_truth": 0}, {"key": "39652762", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.051350089482976674, "res": {"No": 0.9486363733781064, "Yes": 0.051350089482976674}, "ground_truth": 0}, {"key": "33258866", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9863484403769779, "res": {"Yes": 0.9863484403769779, "No": 0.013650942665392057}, "ground_truth": 0}, {"key": "33258866", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9852365789243072, "res": {"Yes": 0.9852365789243072, "No": 0.014762575251425214}, "ground_truth": 0}, {"key": "33258866", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995424991054646, "res": {"Yes": 0.9995424991054646, "No": 0.0004566935321568752}, "ground_truth": 1}, {"key": "33258866", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9834296833978063, "res": {"Yes": 0.9834296833978063, "No": 0.016569714129264532}, "ground_truth": 0}, {"key": "33258866", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999184866352079, "res": {"Yes": 0.999184866352079, "No": 0.0008150900174204629}, "ground_truth": 0}, {"key": "36962388", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7370888778249322, "res": {"Yes": 0.7370888778249322, "No": 0.26291039717664116}, "ground_truth": 0}, {"key": "36962388", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7841440800048425, "res": {"Yes": 0.7841440800048425, "No": 0.2158550416631522}, "ground_truth": 0}, {"key": "36962388", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9415353077451932, "res": {"Yes": 0.9415353077451932, "No": 0.05846435656054361}, "ground_truth": 1}, {"key": "36962388", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9795434218032204, "res": {"Yes": 0.9795434218032204, "No": 0.02045423760728205}, "ground_truth": 0}, {"key": "36962388", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5303203876900479, "res": {"Yes": 0.5303203876900479, "No": 0.4696729629435221}, "ground_truth": 0}, {"key": "32282272", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 8.750219134093826e-08, "res": {"No": 0.9999998063873687, "Yes": 8.750219134093826e-08}, "ground_truth": 0}, {"key": "32282272", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9794394468285825, "res": {"Yes": 0.9794394468285825, "No": 0.020559702671554676}, "ground_truth": 0}, {"key": "32282272", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9880912640303418, "res": {"Yes": 0.9880912640303418, "No": 0.011907693204199238}, "ground_truth": 1}, {"key": "32282272", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8454280515555076, "res": {"Yes": 0.8454280515555076, "No": 0.15456942976417617}, "ground_truth": 0}, {"key": "32282272", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.3283228026958734, "res": {"No": 0.6716756961233488, "Yes": 0.3283228026958734}, "ground_truth": 0}, {"key": "36093072", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5379755854793338, "res": {"Yes": 0.5379755854793338, "No": 0.4620175692240422}, "ground_truth": 0}, {"key": "36093072", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.998829748179347, "res": {"Yes": 0.998829748179347, "No": 0.001169509323221039}, "ground_truth": 0}, {"key": "36093072", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9885774157990002, "res": {"Yes": 0.9885774157990002, "No": 0.011419666252570744}, "ground_truth": 1}, {"key": "36093072", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9975079500250037, "res": {"Yes": 0.9975079500250037, "No": 0.002491634644903062}, "ground_truth": 0}, {"key": "36093072", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9313492898488067, "res": {"Yes": 0.9313492898488067, "No": 0.06864846546778491}, "ground_truth": 0}, {"key": "38879972", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.002279049064477812, "res": {"No": 0.9977206676320963, "Yes": 0.002279049064477812}, "ground_truth": 0}, {"key": "38879972", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992337873309565, "res": {"Yes": 0.9992337873309565, "No": 0.0007657115696958745}, "ground_truth": 0}, {"key": "38879972", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9948610876221375, "res": {"Yes": 0.9948610876221375, "No": 0.005138633967061578}, "ground_truth": 1}, {"key": "38879972", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9937260300588509, "res": {"Yes": 0.9937260300588509, "No": 0.006273300922196564}, "ground_truth": 0}, {"key": "38879972", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994303291740754, "res": {"Yes": 0.9994303291740754, "No": 0.000569520374270816}, "ground_truth": 0}, {"key": "32106473", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996163522716176, "res": {"Yes": 0.9996163522716176, "No": 0.00038355827232644925}, "ground_truth": 0}, {"key": "32106473", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989767649623579, "res": {"Yes": 0.9989767649623579, "No": 0.0010227550126683212}, "ground_truth": 0}, {"key": "32106473", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9978873069841938, "res": {"Yes": 0.9978873069841938, "No": 0.0021099152461549107}, "ground_truth": 1}, {"key": "32106473", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997160594587478, "res": {"Yes": 0.9997160594587478, "No": 0.0002837942653789779}, "ground_truth": 0}, {"key": "32106473", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9955197736913162, "res": {"Yes": 0.9955197736913162, "No": 0.004479577701752293}, "ground_truth": 0}, {"key": "40415815", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0002313291430283353, "res": {"No": 0.999768477225535, "Yes": 0.0002313291430283353}, "ground_truth": 0}, {"key": "40415815", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9928050206933741, "res": {"Yes": 0.9928050206933741, "No": 0.007194870049708531}, "ground_truth": 0}, {"key": "40415815", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.99911275633363, "res": {"Yes": 0.99911275633363, "No": 0.0008871205298940681}, "ground_truth": 1}, {"key": "40415815", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9973189172393873, "res": {"Yes": 0.9973189172393873, "No": 0.002680939462975086}, "ground_truth": 0}, {"key": "40415815", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9973315941409796, "res": {"Yes": 0.9973315941409796, "No": 0.0026682298605791408}, "ground_truth": 0}, {"key": "34581918", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6670575866411443, "res": {"Yes": 0.6670575866411443, "No": 0.33294199279045744}, "ground_truth": 0}, {"key": "34581918", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999040904456155, "res": {"Yes": 0.9999040904456155, "No": 9.553260071377592e-05}, "ground_truth": 0}, {"key": "34581918", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999168440936441, "res": {"Yes": 0.9999168440936441, "No": 8.252229984474398e-05}, "ground_truth": 1}, {"key": "34581918", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.996339896467949, "res": {"Yes": 0.996339896467949, "No": 0.0036594442037470557}, "ground_truth": 0}, {"key": "34581918", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9952326430925791, "res": {"Yes": 0.9952326430925791, "No": 0.00476703862601078}, "ground_truth": 0}, {"key": "33004157", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9942972945095122, "res": {"Yes": 0.9942972945095122, "No": 0.005702339783702927}, "ground_truth": 0}, {"key": "33004157", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991586852338903, "res": {"Yes": 0.9991586852338903, "No": 0.0008395728561857237}, "ground_truth": 0}, {"key": "33004157", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998752536714703, "res": {"Yes": 0.9998752536714703, "No": 0.0001243649711134938}, "ground_truth": 1}, {"key": "33004157", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9959786239753367, "res": {"Yes": 0.9959786239753367, "No": 0.004020738446747381}, "ground_truth": 0}, {"key": "33004157", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999663107274963, "res": {"Yes": 0.9999663107274963, "No": 3.3191524525805204e-05}, "ground_truth": 0}, {"key": "30334943", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9815784988621491, "res": {"Yes": 0.9815784988621491, "No": 0.018421225857803498}, "ground_truth": 0}, {"key": "30334943", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996030140197951, "res": {"Yes": 0.9996030140197951, "No": 0.00039648712065581737}, "ground_truth": 0}, {"key": "30334943", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9927919787958824, "res": {"Yes": 0.9927919787958824, "No": 0.0072067247197655435}, "ground_truth": 1}, {"key": "30334943", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9972569074726776, "res": {"Yes": 0.9972569074726776, "No": 0.0027423775934791103}, "ground_truth": 0}, {"key": "30334943", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9229018667615062, "res": {"Yes": 0.9229018667615062, "No": 0.07709541256411222}, "ground_truth": 0}, {"key": "33280503", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9982081408000202, "res": {"Yes": 0.9982081408000202, "No": 0.0017914969924668395}, "ground_truth": 0}, {"key": "33280503", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9960679141744727, "res": {"Yes": 0.9960679141744727, "No": 0.003931743157162458}, "ground_truth": 0}, {"key": "33280503", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.993030675571408, "res": {"Yes": 0.993030675571408, "No": 0.006968895023438646}, "ground_truth": 1}, {"key": "33280503", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989175226018027, "res": {"Yes": 0.9989175226018027, "No": 0.0010821191331976674}, "ground_truth": 0}, {"key": "33280503", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9923917007567437, "res": {"Yes": 0.9923917007567437, "No": 0.007607733372718848}, "ground_truth": 0}, {"key": "25726782", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8776993324076479, "res": {"Yes": 0.8776993324076479, "No": 0.12229929510017737}, "ground_truth": 0}, {"key": "25726782", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999177976487984, "res": {"Yes": 0.9999177976487984, "No": 8.211350996907853e-05}, "ground_truth": 0}, {"key": "25726782", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995606062817066, "res": {"Yes": 0.9995606062817066, "No": 0.00043851962162666085}, "ground_truth": 1}, {"key": "25726782", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999708403221517, "res": {"Yes": 0.9999708403221517, "No": 2.8983872597383487e-05}, "ground_truth": 0}, {"key": "25726782", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999777296302151, "res": {"Yes": 0.999777296302151, "No": 0.0002225590718798065}, "ground_truth": 0}, {"key": "35479854", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9845557182741034, "res": {"Yes": 0.9845557182741034, "No": 0.015442137574865745}, "ground_truth": 0}, {"key": "35479854", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.963208561371494, "res": {"Yes": 0.963208561371494, "No": 0.03678756494553924}, "ground_truth": 0}, {"key": "35479854", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9080875176032284, "res": {"Yes": 0.9080875176032284, "No": 0.09190752228796757}, "ground_truth": 1}, {"key": "35479854", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996312434874021, "res": {"Yes": 0.9996312434874021, "No": 0.0003637113497888626}, "ground_truth": 0}, {"key": "35479854", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9546219220778243, "res": {"Yes": 0.9546219220778243, "No": 0.04537577076431566}, "ground_truth": 0}, {"key": "32716226", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999282867615172, "res": {"Yes": 0.9999282867615172, "No": 7.082107018897215e-05}, "ground_truth": 0}, {"key": "32716226", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.998595992142549, "res": {"Yes": 0.998595992142549, "No": 0.0014037767443757028}, "ground_truth": 0}, {"key": "32716226", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9977661207303795, "res": {"Yes": 0.9977661207303795, "No": 0.002233043110991302}, "ground_truth": 1}, {"key": "32716226", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997722908696604, "res": {"Yes": 0.9997722908696604, "No": 0.00022660933823573533}, "ground_truth": 0}, {"key": "32716226", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999198239442718, "res": {"Yes": 0.9999198239442718, "No": 7.982139353715738e-05}, "ground_truth": 0}, {"key": "37047554", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9648302479278407, "res": {"Yes": 0.9648302479278407, "No": 0.03516901991354932}, "ground_truth": 0}, {"key": "37047554", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9958142786535726, "res": {"Yes": 0.9958142786535726, "No": 0.004185352705907267}, "ground_truth": 0}, {"key": "37047554", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988003691330953, "res": {"Yes": 0.9988003691330953, "No": 0.001199425484198233}, "ground_truth": 1}, {"key": "37047554", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9934014701425761, "res": {"Yes": 0.9934014701425761, "No": 0.006596302593723024}, "ground_truth": 0}, {"key": "37047554", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.991254665857521, "res": {"Yes": 0.991254665857521, "No": 0.00874478024538487}, "ground_truth": 0}, {"key": "36565290", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9966872150211169, "res": {"Yes": 0.9966872150211169, "No": 0.003311943837100813}, "ground_truth": 0}, {"key": "36565290", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993682980577381, "res": {"Yes": 0.9993682980577381, "No": 0.000631221580107556}, "ground_truth": 0}, {"key": "36565290", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988076246450894, "res": {"Yes": 0.9988076246450894, "No": 0.0011896551544872329}, "ground_truth": 1}, {"key": "36565290", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9870698658351696, "res": {"Yes": 0.9870698658351696, "No": 0.012921237544975116}, "ground_truth": 0}, {"key": "36565290", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9977301638828309, "res": {"Yes": 0.9977301638828309, "No": 0.002267347347911906}, "ground_truth": 0}, {"key": "27758640", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 7.16764009872072e-05, "res": {"No": 0.9999281675700725, "Yes": 7.16764009872072e-05}, "ground_truth": 0}, {"key": "27758640", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9964619146266488, "res": {"Yes": 0.9964619146266488, "No": 0.003537613258458246}, "ground_truth": 0}, {"key": "27758640", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9938514209536098, "res": {"Yes": 0.9938514209536098, "No": 0.006148236415469431}, "ground_truth": 1}, {"key": "27758640", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9865236965270545, "res": {"Yes": 0.9865236965270545, "No": 0.013470798640576268}, "ground_truth": 0}, {"key": "27758640", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9853777724570348, "res": {"Yes": 0.9853777724570348, "No": 0.014620092466828993}, "ground_truth": 0}, {"key": "28897118", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9976770040409421, "res": {"Yes": 0.9976770040409421, "No": 0.0023229508114461284}, "ground_truth": 0}, {"key": "28897118", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999360344758814, "res": {"Yes": 0.9999360344758814, "No": 6.390736148551304e-05}, "ground_truth": 0}, {"key": "28897118", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999214926618624, "res": {"Yes": 0.9999214926618624, "No": 7.821618206835872e-05}, "ground_truth": 1}, {"key": "28897118", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998020817783959, "res": {"Yes": 0.9998020817783959, "No": 0.00019771677116494924}, "ground_truth": 0}, {"key": "28897118", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993579449056404, "res": {"Yes": 0.9993579449056404, "No": 0.0006417472650040365}, "ground_truth": 0}, {"key": "38452661", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 2.030515208136584e-06, "res": {"No": 0.9999971839107652, "Yes": 2.030515208136584e-06}, "ground_truth": 0}, {"key": "38452661", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9985477267708747, "res": {"Yes": 0.9985477267708747, "No": 0.0014517072519809517}, "ground_truth": 0}, {"key": "38452661", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990095990710669, "res": {"Yes": 0.9990095990710669, "No": 0.0009901378322812089}, "ground_truth": 1}, {"key": "38452661", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9955335994663864, "res": {"Yes": 0.9955335994663864, "No": 0.00446633105703933}, "ground_truth": 0}, {"key": "38452661", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996050323502665, "res": {"Yes": 0.9996050323502665, "No": 0.00039408741807097074}, "ground_truth": 0}, {"key": "38033492", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999472389619125, "res": {"Yes": 0.9999472389619125, "No": 5.2628329476556096e-05}, "ground_truth": 0}, {"key": "38033492", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994689115774082, "res": {"Yes": 0.9994689115774082, "No": 0.0005309103411698153}, "ground_truth": 0}, {"key": "38033492", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999959918780326, "res": {"Yes": 0.9999959918780326, "No": 3.777723418531904e-06}, "ground_truth": 1}, {"key": "38033492", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999972151525776, "res": {"Yes": 0.999972151525776, "No": 2.77316554842879e-05}, "ground_truth": 0}, {"key": "38033492", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999280483736425, "res": {"Yes": 0.9999280483736425, "No": 7.181293104543356e-05}, "ground_truth": 0}, {"key": "35949555", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0011577423734667207, "res": {"No": 0.9988414056892488, "Yes": 0.0011577423734667207}, "ground_truth": 0}, {"key": "35949555", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.4211081036481551, "res": {"No": 0.5788784525257, "Yes": 0.4211081036481551}, "ground_truth": 0}, {"key": "35949555", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6994436819384408, "res": {"Yes": 0.6994436819384408, "No": 0.3005539821626939}, "ground_truth": 1}, {"key": "35949555", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.07013036582942274, "res": {"No": 0.9298356861537199, "Yes": 0.07013036582942274}, "ground_truth": 0}, {"key": "35949555", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6385921572109093, "res": {"Yes": 0.6385921572109093, "No": 0.3613937842712497}, "ground_truth": 0}, {"key": "15263826", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.006842771769307697, "res": {"No": 0.9931567169376706, "Yes": 0.006842771769307697}, "ground_truth": 0}, {"key": "15263826", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.988260176858529, "res": {"Yes": 0.988260176858529, "No": 0.011739493601116813}, "ground_truth": 0}, {"key": "15263826", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.993193872817258, "res": {"Yes": 0.993193872817258, "No": 0.00680471176589403}, "ground_truth": 1}, {"key": "15263826", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9888269197332227, "res": {"Yes": 0.9888269197332227, "No": 0.011172766770717716}, "ground_truth": 0}, {"key": "15263826", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.986385210159486, "res": {"Yes": 0.986385210159486, "No": 0.01361380401367284}, "ground_truth": 0}, {"key": "37313866", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.007392537008704406, "res": {"No": 0.9926073083707686, "Yes": 0.007392537008704406}, "ground_truth": 0}, {"key": "37313866", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.02574749598247158, "res": {"No": 0.9742508074229975, "Yes": 0.02574749598247158}, "ground_truth": 0}, {"key": "37313866", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0001679144389934066, "res": {"No": 0.9998311584553382, "Yes": 0.0001679144389934066}, "ground_truth": 1}, {"key": "37313866", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.06942345501861158, "res": {"No": 0.930574431717572, "Yes": 0.06942345501861158}, "ground_truth": 0}, {"key": "37313866", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.1444763865011972, "res": {"No": 0.8555213241592381, "Yes": 0.1444763865011972}, "ground_truth": 0}, {"key": "13911157", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9989444082293766, "res": {"Yes": 0.9989444082293766, "No": 0.0010553796700179111}, "ground_truth": 0}, {"key": "13911157", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995735864701022, "res": {"Yes": 0.9995735864701022, "No": 0.0004259911442740772}, "ground_truth": 0}, {"key": "13911157", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995395277199169, "res": {"Yes": 0.9995395277199169, "No": 0.00045978457196190213}, "ground_truth": 1}, {"key": "13911157", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992560432731353, "res": {"Yes": 0.9992560432731353, "No": 0.0007436600125157261}, "ground_truth": 0}, {"key": "13911157", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9982058835545035, "res": {"Yes": 0.9982058835545035, "No": 0.0017933731340762766}, "ground_truth": 0}, {"key": "39594894", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.12321380260827489, "res": {"No": 0.8767854739891849, "Yes": 0.12321380260827489}, "ground_truth": 0}, {"key": "39594894", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9964890175635543, "res": {"Yes": 0.9964890175635543, "No": 0.003510594087951063}, "ground_truth": 0}, {"key": "39594894", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998784552455445, "res": {"Yes": 0.998784552455445, "No": 0.0012153556852127752}, "ground_truth": 1}, {"key": "39594894", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989107390758315, "res": {"Yes": 0.9989107390758315, "No": 0.0010890767064504795}, "ground_truth": 0}, {"key": "39594894", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9974510117017966, "res": {"Yes": 0.9974510117017966, "No": 0.0025488270653627808}, "ground_truth": 0}, {"key": "34096170", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.998273596651648, "res": {"Yes": 0.998273596651648, "No": 0.0017257940768748423}, "ground_truth": 0}, {"key": "34096170", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9980783309747897, "res": {"Yes": 0.9980783309747897, "No": 0.0019212620330405906}, "ground_truth": 0}, {"key": "34096170", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9974367876530655, "res": {"Yes": 0.9974367876530655, "No": 0.0025628980756180184}, "ground_truth": 1}, {"key": "34096170", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997236863416524, "res": {"Yes": 0.9997236863416524, "No": 0.00027603303703730526}, "ground_truth": 0}, {"key": "34096170", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993409171905551, "res": {"Yes": 0.9993409171905551, "No": 0.0006585654823758722}, "ground_truth": 0}, {"key": "37891952", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9949328246671293, "res": {"Yes": 0.9949328246671293, "No": 0.005066805696884085}, "ground_truth": 0}, {"key": "37891952", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9962018050592062, "res": {"Yes": 0.9962018050592062, "No": 0.0037978620082234488}, "ground_truth": 0}, {"key": "37891952", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9979992581576075, "res": {"Yes": 0.9979992581576075, "No": 0.001999772809749213}, "ground_truth": 1}, {"key": "37891952", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989420267487461, "res": {"Yes": 0.9989420267487461, "No": 0.001057702686170344}, "ground_truth": 0}, {"key": "37891952", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990540941112881, "res": {"Yes": 0.9990540941112881, "No": 0.0009456456842805685}, "ground_truth": 0}, {"key": "40186158", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.001161666926226893, "res": {"No": 0.9988379528003616, "Yes": 0.001161666926226893}, "ground_truth": 0}, {"key": "40186158", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9981698998791989, "res": {"Yes": 0.9981698998791989, "No": 0.001829787388547393}, "ground_truth": 0}, {"key": "40186158", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9976901682763246, "res": {"Yes": 0.9976901682763246, "No": 0.002309726176006514}, "ground_truth": 1}, {"key": "40186158", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9975622827701751, "res": {"Yes": 0.9975622827701751, "No": 0.002437653701633197}, "ground_truth": 0}, {"key": "40186158", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994524777450445, "res": {"Yes": 0.9994524777450445, "No": 0.0005472486984009704}, "ground_truth": 0}, {"key": "37049719", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.04945398191948016, "res": {"No": 0.9505456983380093, "Yes": 0.04945398191948016}, "ground_truth": 0}, {"key": "37049719", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7944159090132312, "res": {"Yes": 0.7944159090132312, "No": 0.20558306859167097}, "ground_truth": 0}, {"key": "37049719", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.995853528948969, "res": {"Yes": 0.995853528948969, "No": 0.004146249866088615}, "ground_truth": 1}, {"key": "37049719", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9683231216965452, "res": {"Yes": 0.9683231216965452, "No": 0.03167505868670041}, "ground_truth": 0}, {"key": "37049719", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9839470198453254, "res": {"Yes": 0.9839470198453254, "No": 0.016051825460770417}, "ground_truth": 0}, {"key": "34610504", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8703934049001374, "res": {"Yes": 0.8703934049001374, "No": 0.12960410774538683}, "ground_truth": 0}, {"key": "34610504", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993135371934755, "res": {"Yes": 0.9993135371934755, "No": 0.0006856044500251324}, "ground_truth": 0}, {"key": "34610504", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992698423948916, "res": {"Yes": 0.9992698423948916, "No": 0.0007299350502794731}, "ground_truth": 1}, {"key": "34610504", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9943616539762042, "res": {"Yes": 0.9943616539762042, "No": 0.005637818945811418}, "ground_truth": 0}, {"key": "34610504", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9979766952462359, "res": {"Yes": 0.9979766952462359, "No": 0.002022466849538151}, "ground_truth": 0}, {"key": "37595429", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.994341494492389, "res": {"Yes": 0.994341494492389, "No": 0.005656814807679039}, "ground_truth": 0}, {"key": "37595429", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9300576365223279, "res": {"Yes": 0.9300576365223279, "No": 0.06993949275128214}, "ground_truth": 0}, {"key": "37595429", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9968390497559011, "res": {"Yes": 0.9968390497559011, "No": 0.003160158798361166}, "ground_truth": 1}, {"key": "37595429", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9952990123942776, "res": {"Yes": 0.9952990123942776, "No": 0.004699339086723902}, "ground_truth": 0}, {"key": "37595429", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9989754550049849, "res": {"Yes": 0.9989754550049849, "No": 0.001022406312665731}, "ground_truth": 0}, {"key": "29772670", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9983883647810649, "res": {"Yes": 0.9983883647810649, "No": 0.001611159778505209}, "ground_truth": 0}, {"key": "29772670", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8828339218882011, "res": {"Yes": 0.8828339218882011, "No": 0.1171636152645462}, "ground_truth": 0}, {"key": "29772670", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.46770381375841286, "res": {"No": 0.5322896409058638, "Yes": 0.46770381375841286}, "ground_truth": 1}, {"key": "29772670", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7498915371823804, "res": {"Yes": 0.7498915371823804, "No": 0.2501008356101467}, "ground_truth": 0}, {"key": "29772670", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7478286909735584, "res": {"Yes": 0.7478286909735584, "No": 0.25215941305103406}, "ground_truth": 0}, {"key": "36369872", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9777358396880933, "res": {"Yes": 0.9777358396880933, "No": 0.022262640930227087}, "ground_truth": 0}, {"key": "36369872", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9852866824340013, "res": {"Yes": 0.9852866824340013, "No": 0.014712673702622758}, "ground_truth": 0}, {"key": "36369872", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9027676027354963, "res": {"Yes": 0.9027676027354963, "No": 0.09723184477790293}, "ground_truth": 1}, {"key": "36369872", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9511252154159983, "res": {"Yes": 0.9511252154159983, "No": 0.04887386419126694}, "ground_truth": 0}, {"key": "36369872", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8998600569731998, "res": {"Yes": 0.8998600569731998, "No": 0.10013837494931072}, "ground_truth": 0}, {"key": "34527433", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.00445964817763503, "res": {"No": 0.9955393886106529, "Yes": 0.00445964817763503}, "ground_truth": 0}, {"key": "34527433", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9976473420480464, "res": {"Yes": 0.9976473420480464, "No": 0.002351598427805832}, "ground_truth": 0}, {"key": "34527433", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9845524830293286, "res": {"Yes": 0.9845524830293286, "No": 0.01544715399577271}, "ground_truth": 1}, {"key": "34527433", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9862317854345748, "res": {"Yes": 0.9862317854345748, "No": 0.013767562460916183}, "ground_truth": 0}, {"key": "34527433", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9853157330548084, "res": {"Yes": 0.9853157330548084, "No": 0.014683894471574614}, "ground_truth": 0}, {"key": "31111734", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4830210714938017, "res": {"No": 0.5169719299749522, "Yes": 0.4830210714938017}, "ground_truth": 0}, {"key": "31111734", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.06078525718032174, "res": {"No": 0.9391904248186901, "Yes": 0.06078525718032174}, "ground_truth": 0}, {"key": "31111734", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.012580264531371059, "res": {"No": 0.9874148290399438, "Yes": 0.012580264531371059}, "ground_truth": 1}, {"key": "31111734", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.675225905017832, "res": {"Yes": 0.675225905017832, "No": 0.3247564701988104}, "ground_truth": 0}, {"key": "31111734", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7383371100442555, "res": {"Yes": 0.7383371100442555, "No": 0.26165728605023353}, "ground_truth": 0}, {"key": "40303872", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0053040075640322405, "res": {"No": 0.994695805183648, "Yes": 0.0053040075640322405}, "ground_truth": 0}, {"key": "40303872", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.910162525470579, "res": {"Yes": 0.910162525470579, "No": 0.0898334031609178}, "ground_truth": 0}, {"key": "40303872", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9810675357544572, "res": {"Yes": 0.9810675357544572, "No": 0.018930833198829912}, "ground_truth": 1}, {"key": "40303872", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986574552206681, "res": {"Yes": 0.9986574552206681, "No": 0.00134087887921958}, "ground_truth": 0}, {"key": "40303872", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8662662063706861, "res": {"Yes": 0.8662662063706861, "No": 0.1337314492528924}, "ground_truth": 0}, {"key": "33653553", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8779205229520542, "res": {"Yes": 0.8779205229520542, "No": 0.12207652216686592}, "ground_truth": 0}, {"key": "33653553", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9983650754476404, "res": {"Yes": 0.9983650754476404, "No": 0.001634822570652791}, "ground_truth": 0}, {"key": "33653553", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9974635895386116, "res": {"Yes": 0.9974635895386116, "No": 0.0025358720427727864}, "ground_truth": 1}, {"key": "33653553", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9788389838487594, "res": {"Yes": 0.9788389838487594, "No": 0.02116039087096161}, "ground_truth": 0}, {"key": "33653553", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9974683309930537, "res": {"Yes": 0.9974683309930537, "No": 0.0025315252304579676}, "ground_truth": 0}, {"key": "34404510", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9563734348267628, "res": {"Yes": 0.9563734348267628, "No": 0.04362605130796509}, "ground_truth": 0}, {"key": "34404510", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993427041136467, "res": {"Yes": 0.9993427041136467, "No": 0.0006539105431743227}, "ground_truth": 0}, {"key": "34404510", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996037216190272, "res": {"Yes": 0.9996037216190272, "No": 0.000395757582327283}, "ground_truth": 1}, {"key": "34404510", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992768665870823, "res": {"Yes": 0.9992768665870823, "No": 0.0007220555377055122}, "ground_truth": 0}, {"key": "34404510", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9958006822965574, "res": {"Yes": 0.9958006822965574, "No": 0.004198793738765157}, "ground_truth": 0}, {"key": "35568692", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.024947716101315312, "res": {"No": 0.9750241227580918, "Yes": 0.024947716101315312}, "ground_truth": 0}, {"key": "35568692", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.019936132303252762, "res": {"No": 0.9800531461721964, "Yes": 0.019936132303252762}, "ground_truth": 0}, {"key": "35568692", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6563375266676948, "res": {"Yes": 0.6563375266676948, "No": 0.34365219298009786}, "ground_truth": 1}, {"key": "35568692", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5000785664520135, "res": {"Yes": 0.5000785664520135, "No": 0.4999030996708598}, "ground_truth": 0}, {"key": "35568692", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.4010213424598384, "res": {"No": 0.5989440445528413, "Yes": 0.4010213424598384}, "ground_truth": 0}, {"key": "39151664", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9836904133623845, "res": {"Yes": 0.9836904133623845, "No": 0.016308187445639066}, "ground_truth": 0}, {"key": "39151664", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.33108514534265465, "res": {"No": 0.6688945530743431, "Yes": 0.33108514534265465}, "ground_truth": 0}, {"key": "39151664", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9863579537535635, "res": {"Yes": 0.9863579537535635, "No": 0.013638690985187763}, "ground_truth": 1}, {"key": "39151664", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.2200515372141636, "res": {"No": 0.7799332031131366, "Yes": 0.2200515372141636}, "ground_truth": 0}, {"key": "39151664", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.1676890680189847, "res": {"No": 0.8322966177311742, "Yes": 0.1676890680189847}, "ground_truth": 0}, {"key": "37493670", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9707502624620628, "res": {"Yes": 0.9707502624620628, "No": 0.029247768465278157}, "ground_truth": 0}, {"key": "37493670", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997712182745312, "res": {"Yes": 0.9997712182745312, "No": 0.0002271118342287936}, "ground_truth": 0}, {"key": "37493670", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999818286721858, "res": {"Yes": 0.999818286721858, "No": 0.0001804068463704797}, "ground_truth": 1}, {"key": "37493670", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995622743898207, "res": {"Yes": 0.9995622743898207, "No": 0.000436259634446667}, "ground_truth": 0}, {"key": "37493670", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985509371069768, "res": {"Yes": 0.9985509371069768, "No": 0.0014465266643730625}, "ground_truth": 0}, {"key": "21935983", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999267372238483, "res": {"Yes": 0.9999267372238483, "No": 7.26859101735185e-05}, "ground_truth": 0}, {"key": "21935983", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9944119903343245, "res": {"Yes": 0.9944119903343245, "No": 0.005587552070392311}, "ground_truth": 0}, {"key": "21935983", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997831359983979, "res": {"Yes": 0.9997831359983979, "No": 0.00021632449195516253}, "ground_truth": 1}, {"key": "21935983", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994134194057027, "res": {"Yes": 0.9994134194057027, "No": 0.0005863505728977694}, "ground_truth": 0}, {"key": "21935983", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9966360587712941, "res": {"Yes": 0.9966360587712941, "No": 0.0033621433721705476}, "ground_truth": 0}, {"key": "38174214", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9982190659484449, "res": {"Yes": 0.9982190659484449, "No": 0.0017806834993214103}, "ground_truth": 0}, {"key": "38174214", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.711009477109356, "res": {"Yes": 0.711009477109356, "No": 0.28898624128886746}, "ground_truth": 0}, {"key": "38174214", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9977237560812031, "res": {"Yes": 0.9977237560812031, "No": 0.002275981252023504}, "ground_truth": 1}, {"key": "38174214", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6884603165637163, "res": {"Yes": 0.6884603165637163, "No": 0.31153742609322155}, "ground_truth": 0}, {"key": "38174214", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.659937595965085, "res": {"Yes": 0.659937595965085, "No": 0.34005683961701805}, "ground_truth": 0}, {"key": "40319923", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3393480507223131, "res": {"No": 0.6606480511659151, "Yes": 0.3393480507223131}, "ground_truth": 0}, {"key": "40319923", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8734201215604315, "res": {"Yes": 0.8734201215604315, "No": 0.12657817215179293}, "ground_truth": 0}, {"key": "40319923", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9949250376568638, "res": {"Yes": 0.9949250376568638, "No": 0.005073400378975768}, "ground_truth": 1}, {"key": "40319923", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8819857143399479, "res": {"Yes": 0.8819857143399479, "No": 0.1180109691427515}, "ground_truth": 0}, {"key": "40319923", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.38226939362957174, "res": {"No": 0.6177189490289726, "Yes": 0.38226939362957174}, "ground_truth": 0}, {"key": "36478264", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9917102966663541, "res": {"Yes": 0.9917102966663541, "No": 0.008288729321925314}, "ground_truth": 0}, {"key": "36478264", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9924042640190015, "res": {"Yes": 0.9924042640190015, "No": 0.007595332234853186}, "ground_truth": 0}, {"key": "36478264", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987215339349488, "res": {"Yes": 0.9987215339349488, "No": 0.0012779866104983837}, "ground_truth": 1}, {"key": "36478264", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993500862554875, "res": {"Yes": 0.9993500862554875, "No": 0.0006497109410906637}, "ground_truth": 0}, {"key": "36478264", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988675710821123, "res": {"Yes": 0.9988675710821123, "No": 0.0011320147151913395}, "ground_truth": 0}, {"key": "11935769", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.10808461352895166, "res": {"No": 0.8919099450169119, "Yes": 0.10808461352895166}, "ground_truth": 0}, {"key": "11935769", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991720138998202, "res": {"Yes": 0.9991720138998202, "No": 0.0008274730659033995}, "ground_truth": 0}, {"key": "11935769", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993374626048896, "res": {"Yes": 0.9993374626048896, "No": 0.0006622792256129154}, "ground_truth": 1}, {"key": "11935769", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9971937198862579, "res": {"Yes": 0.9971937198862579, "No": 0.0028058532424669828}, "ground_truth": 0}, {"key": "11935769", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9976622900099202, "res": {"Yes": 0.9976622900099202, "No": 0.0023361838831787384}, "ground_truth": 0}, {"key": "33373410", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 4.741324646558793e-06, "res": {"No": 0.9999950382530095, "Yes": 4.741324646558793e-06}, "ground_truth": 0}, {"key": "33373410", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9650212704200575, "res": {"Yes": 0.9650212704200575, "No": 0.034976740344408}, "ground_truth": 0}, {"key": "33373410", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9492869302171709, "res": {"Yes": 0.9492869302171709, "No": 0.0507090187291691}, "ground_truth": 1}, {"key": "33373410", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9353771612627745, "res": {"Yes": 0.9353771612627745, "No": 0.06462084772857392}, "ground_truth": 0}, {"key": "33373410", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.781597380279376, "res": {"Yes": 0.781597380279376, "No": 0.21839968006856125}, "ground_truth": 0}, {"key": "11130680", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.04208152797579754, "res": {"No": 0.9579174124748714, "Yes": 0.04208152797579754}, "ground_truth": 0}, {"key": "11130680", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.008322821159113357, "res": {"No": 0.9916762944783322, "Yes": 0.008322821159113357}, "ground_truth": 0}, {"key": "11130680", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8998343843319964, "res": {"Yes": 0.8998343843319964, "No": 0.10016302203608538}, "ground_truth": 1}, {"key": "11130680", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.09636189842975018, "res": {"No": 0.9036322901701891, "Yes": 0.09636189842975018}, "ground_truth": 0}, {"key": "11130680", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7930172299735804, "res": {"Yes": 0.7930172299735804, "No": 0.2069750964415279}, "ground_truth": 0}, {"key": "34868650", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9361985209139237, "res": {"Yes": 0.9361985209139237, "No": 0.0638010392231466}, "ground_truth": 0}, {"key": "34868650", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9988944516693435, "res": {"Yes": 0.9988944516693435, "No": 0.0011049188341148214}, "ground_truth": 0}, {"key": "34868650", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9898609571899731, "res": {"Yes": 0.9898609571899731, "No": 0.010137123495584708}, "ground_truth": 1}, {"key": "34868650", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9931348455833329, "res": {"Yes": 0.9931348455833329, "No": 0.00686117890478317}, "ground_truth": 0}, {"key": "34868650", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.997510799909288, "res": {"Yes": 0.997510799909288, "No": 0.002486011649158828}, "ground_truth": 0}, {"key": "33960561", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.09329227238635983, "res": {"No": 0.9067069764759654, "Yes": 0.09329227238635983}, "ground_truth": 0}, {"key": "33960561", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.982364066026496, "res": {"Yes": 0.982364066026496, "No": 0.017634994979212556}, "ground_truth": 0}, {"key": "33960561", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9984080880381871, "res": {"Yes": 0.9984080880381871, "No": 0.0015913341922296476}, "ground_truth": 1}, {"key": "33960561", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9816652349702534, "res": {"Yes": 0.9816652349702534, "No": 0.018333257844481303}, "ground_truth": 0}, {"key": "33960561", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9916433545139449, "res": {"Yes": 0.9916433545139449, "No": 0.008356170759009756}, "ground_truth": 0}, {"key": "22504858", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8193301768776292, "res": {"Yes": 0.8193301768776292, "No": 0.18066947898393698}, "ground_truth": 0}, {"key": "22504858", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9983534346785624, "res": {"Yes": 0.9983534346785624, "No": 0.0016459286914377394}, "ground_truth": 0}, {"key": "22504858", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996517244820033, "res": {"Yes": 0.9996517244820033, "No": 0.00034765915423842287}, "ground_truth": 1}, {"key": "22504858", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999304322739465, "res": {"Yes": 0.9999304322739465, "No": 6.929630306616461e-05}, "ground_truth": 0}, {"key": "22504858", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999499805090164, "res": {"Yes": 0.9999499805090164, "No": 4.9570929244548674e-05}, "ground_truth": 0}, {"key": "32283530", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0056201102378112995, "res": {"No": 0.994373793018499, "Yes": 0.0056201102378112995}, "ground_truth": 0}, {"key": "32283530", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9950968823177956, "res": {"Yes": 0.9950968823177956, "No": 0.004902311256862561}, "ground_truth": 0}, {"key": "32283530", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0040191895546370735, "res": {"No": 0.9959786239753367, "Yes": 0.0040191895546370735}, "ground_truth": 1}, {"key": "32283530", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986148898517744, "res": {"Yes": 0.9986148898517744, "No": 0.0013843604706879093}, "ground_truth": 0}, {"key": "32283530", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.32132760498781693, "res": {"No": 0.6786694763387963, "Yes": 0.32132760498781693}, "ground_truth": 0}, {"key": "38377099", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0013121372272359027, "res": {"No": 0.99868764888687, "Yes": 0.0013121372272359027}, "ground_truth": 0}, {"key": "38377099", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999593971683173, "res": {"Yes": 0.9999593971683173, "No": 4.0529275221624534e-05}, "ground_truth": 0}, {"key": "38377099", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999481925440526, "res": {"Yes": 0.9999481925440526, "No": 5.129291112673326e-05}, "ground_truth": 1}, {"key": "38377099", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992955609737547, "res": {"Yes": 0.9992955609737547, "No": 0.000704336734578712}, "ground_truth": 0}, {"key": "38377099", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996273111857361, "res": {"Yes": 0.9996273111857361, "No": 0.0003722313456798794}, "ground_truth": 0}, {"key": "36105123", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9924257532773905, "res": {"Yes": 0.9924257532773905, "No": 0.0075736209270186655}, "ground_truth": 0}, {"key": "36105123", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.0013676955988534776, "res": {"No": 0.9986311762949581, "Yes": 0.0013676955988534776}, "ground_truth": 0}, {"key": "36105123", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9843716796773617, "res": {"Yes": 0.9843716796773617, "No": 0.01562517786600723}, "ground_truth": 1}, {"key": "36105123", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9975723537110364, "res": {"Yes": 0.9975723537110364, "No": 0.0024266659518718476}, "ground_truth": 0}, {"key": "36105123", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.003332227099124412, "res": {"No": 0.9966663744096724, "Yes": 0.003332227099124412}, "ground_truth": 0}, {"key": "33527826", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8932044651323717, "res": {"Yes": 0.8932044651323717, "No": 0.10679245510882251}, "ground_truth": 0}, {"key": "33527826", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9949416762258716, "res": {"Yes": 0.9949416762258716, "No": 0.005057872189669254}, "ground_truth": 0}, {"key": "33527826", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9754430635986068, "res": {"Yes": 0.9754430635986068, "No": 0.02455490618757897}, "ground_truth": 1}, {"key": "33527826", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.994240966379334, "res": {"Yes": 0.994240966379334, "No": 0.005756833471330265}, "ground_truth": 0}, {"key": "33527826", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9957089603327665, "res": {"Yes": 0.9957089603327665, "No": 0.004289746666001347}, "ground_truth": 0}, {"key": "32349891", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 3.25089732412622e-06, "res": {"No": 0.9999962302846054, "Yes": 3.25089732412622e-06}, "ground_truth": 0}, {"key": "32349891", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9185407403528085, "res": {"Yes": 0.9185407403528085, "No": 0.08145673162659127}, "ground_truth": 0}, {"key": "32349891", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3093877297001937, "res": {"No": 0.6906089944510967, "Yes": 0.3093877297001937}, "ground_truth": 1}, {"key": "32349891", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9093230112645336, "res": {"Yes": 0.9093230112645336, "No": 0.09067454606514552}, "ground_truth": 0}, {"key": "32349891", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6749074085750635, "res": {"Yes": 0.6749074085750635, "No": 0.32508779326783}, "ground_truth": 0}, {"key": "34281974", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9219409066961511, "res": {"Yes": 0.9219409066961511, "No": 0.07805804986930784}, "ground_truth": 0}, {"key": "34281974", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996181396672228, "res": {"Yes": 0.9996181396672228, "No": 0.0003805379303825255}, "ground_truth": 0}, {"key": "34281974", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990320735433099, "res": {"Yes": 0.9990320735433099, "No": 0.0009671823571404375}, "ground_truth": 1}, {"key": "34281974", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993897340880357, "res": {"Yes": 0.9993897340880357, "No": 0.0006096100911531065}, "ground_truth": 0}, {"key": "34281974", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9980820045086551, "res": {"Yes": 0.9980820045086551, "No": 0.0019164744592500224}, "ground_truth": 0}, {"key": "29387866", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9045062719575143, "res": {"Yes": 0.9045062719575143, "No": 0.09549222007472943}, "ground_truth": 0}, {"key": "29387866", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9984967446219845, "res": {"Yes": 0.9984967446219845, "No": 0.0015028634860215812}, "ground_truth": 0}, {"key": "29387866", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987539988049058, "res": {"Yes": 0.9987539988049058, "No": 0.0012456684319605727}, "ground_truth": 1}, {"key": "29387866", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990895471839025, "res": {"Yes": 0.9990895471839025, "No": 0.0009103085044747205}, "ground_truth": 0}, {"key": "29387866", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995924091877131, "res": {"Yes": 0.9995924091877131, "No": 0.00040731366241926546}, "ground_truth": 0}, {"key": "35731925", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.856835009433514, "res": {"Yes": 0.856835009433514, "No": 0.14314289241220798}, "ground_truth": 0}, {"key": "35731925", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.09582983619087428, "res": {"No": 0.9041479956383325, "Yes": 0.09582983619087428}, "ground_truth": 0}, {"key": "35731925", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.04368958652061763, "res": {"No": 0.9562875276596905, "Yes": 0.04368958652061763}, "ground_truth": 1}, {"key": "35731925", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.05191154845390752, "res": {"No": 0.9480709270144648, "Yes": 0.05191154845390752}, "ground_truth": 0}, {"key": "35731925", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.08317144493340663, "res": {"No": 0.9168184581400681, "Yes": 0.08317144493340663}, "ground_truth": 0}, {"key": "38829733", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9941114826808465, "res": {"Yes": 0.9941114826808465, "No": 0.0058884704556010255}, "ground_truth": 0}, {"key": "38829733", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991826069478545, "res": {"Yes": 0.9991826069478545, "No": 0.0008170428634805554}, "ground_truth": 0}, {"key": "38829733", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999959918780326, "res": {"Yes": 0.9999959918780326, "No": 3.906674724110585e-06}, "ground_truth": 1}, {"key": "38829733", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996960427843574, "res": {"Yes": 0.9996960427843574, "No": 0.00030374014751505745}, "ground_truth": 0}, {"key": "38829733", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998939591587275, "res": {"Yes": 0.9998939591587275, "No": 0.00010569869620785134}, "ground_truth": 0}, {"key": "24624736", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.996910845786171, "res": {"Yes": 0.996910845786171, "No": 0.003088977960204771}, "ground_truth": 0}, {"key": "24624736", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994509325927083, "res": {"Yes": 0.9994509325927083, "No": 0.000548545844585349}, "ground_truth": 0}, {"key": "24624736", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995536991918477, "res": {"Yes": 0.9995536991918477, "No": 0.00044589145946071445}, "ground_truth": 1}, {"key": "24624736", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997883761554854, "res": {"Yes": 0.9997883761554854, "No": 0.00021091655007347368}, "ground_truth": 0}, {"key": "24624736", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999531663903603, "res": {"Yes": 0.999531663903603, "No": 0.0004678257314919392}, "ground_truth": 0}, {"key": "36928562", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.49959812686857635, "res": {"No": 0.5003915735297957, "Yes": 0.49959812686857635}, "ground_truth": 0}, {"key": "36928562", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.011535858090071434, "res": {"No": 0.9884633741552397, "Yes": 0.011535858090071434}, "ground_truth": 0}, {"key": "36928562", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.041321402206864116, "res": {"No": 0.958676062421901, "Yes": 0.041321402206864116}, "ground_truth": 1}, {"key": "36928562", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0036075478621608657, "res": {"No": 0.9963886511624042, "Yes": 0.0036075478621608657}, "ground_truth": 0}, {"key": "36928562", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0023634756743473625, "res": {"No": 0.9976345277492942, "Yes": 0.0023634756743473625}, "ground_truth": 0}, {"key": "34941119", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5009006304424364, "res": {"Yes": 0.5009006304424364, "No": 0.49909820449426046}, "ground_truth": 0}, {"key": "34941119", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991927200259528, "res": {"Yes": 0.9991927200259528, "No": 0.000806860876876795}, "ground_truth": 0}, {"key": "34941119", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9910822679618322, "res": {"Yes": 0.9910822679618322, "No": 0.008917300613449796}, "ground_truth": 1}, {"key": "34941119", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988257038260017, "res": {"Yes": 0.9988257038260017, "No": 0.0011741268664488141}, "ground_truth": 0}, {"key": "34941119", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9926666267677138, "res": {"Yes": 0.9926666267677138, "No": 0.0073313324444935594}, "ground_truth": 0}, {"key": "30206231", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9993522268456778, "res": {"Yes": 0.9993522268456778, "No": 0.0006475445264738015}, "ground_truth": 0}, {"key": "30206231", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9980797586270554, "res": {"Yes": 0.9980797586270554, "No": 0.0019197993569339891}, "ground_truth": 0}, {"key": "30206231", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994766520943144, "res": {"Yes": 0.9994766520943144, "No": 0.0005231540953060148}, "ground_truth": 1}, {"key": "30206231", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9958149872752654, "res": {"Yes": 0.9958149872752654, "No": 0.004184334951893096}, "ground_truth": 0}, {"key": "30206231", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9946692650642474, "res": {"Yes": 0.9946692650642474, "No": 0.005327895283153364}, "ground_truth": 0}, {"key": "35584972", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9899262614612503, "res": {"Yes": 0.9899262614612503, "No": 0.010073379779622693}, "ground_truth": 0}, {"key": "35584972", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.4859193574609735, "res": {"No": 0.5140796111575349, "Yes": 0.4859193574609735}, "ground_truth": 0}, {"key": "35584972", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7405594980657692, "res": {"Yes": 0.7405594980657692, "No": 0.25943481565788845}, "ground_truth": 1}, {"key": "35584972", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9085200609425438, "res": {"Yes": 0.9085200609425438, "No": 0.09147061553241018}, "ground_truth": 0}, {"key": "35584972", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993097252892787, "res": {"Yes": 0.9993097252892787, "No": 0.0006900572450318502}, "ground_truth": 0}, {"key": "39277709", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.07045821076634289, "res": {"No": 0.929539980347091, "Yes": 0.07045821076634289}, "ground_truth": 0}, {"key": "39277709", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.3202736475582811, "res": {"No": 0.6797129651493538, "Yes": 0.3202736475582811}, "ground_truth": 0}, {"key": "39277709", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1423025150162498, "res": {"No": 0.8576964671287634, "Yes": 0.1423025150162498}, "ground_truth": 1}, {"key": "39277709", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8589977554341129, "res": {"Yes": 0.8589977554341129, "No": 0.1409999419931715}, "ground_truth": 0}, {"key": "39277709", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.06496892502110092, "res": {"No": 0.9350286158262628, "Yes": 0.06496892502110092}, "ground_truth": 0}, {"key": "36123657", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3399925069490248, "res": {"No": 0.6600066422481231, "Yes": 0.3399925069490248}, "ground_truth": 0}, {"key": "36123657", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9983432146865976, "res": {"Yes": 0.9983432146865976, "No": 0.0016560013629201397}, "ground_truth": 0}, {"key": "36123657", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9720251532765413, "res": {"Yes": 0.9720251532765413, "No": 0.027954773691312173}, "ground_truth": 1}, {"key": "36123657", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9935037137002697, "res": {"Yes": 0.9935037137002697, "No": 0.0064881184860345375}, "ground_truth": 0}, {"key": "36123657", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9952862570224592, "res": {"Yes": 0.9952862570224592, "No": 0.004712329062855523}, "ground_truth": 0}, {"key": "33363938", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 1.6859875327345867e-05, "res": {"No": 0.9999827604126034, "Yes": 1.6859875327345867e-05}, "ground_truth": 0}, {"key": "33363938", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.0002948225228872893, "res": {"No": 0.9997040270286442, "Yes": 0.0002948225228872893}, "ground_truth": 0}, {"key": "33363938", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00023341279956624712, "res": {"No": 0.999766332054608, "Yes": 0.00023341279956624712}, "ground_truth": 1}, {"key": "33363938", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0011693187087368569, "res": {"No": 0.998830339886265, "Yes": 0.0011693187087368569}, "ground_truth": 0}, {"key": "33363938", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0017042621815476966, "res": {"No": 0.9982956829006745, "Yes": 0.0017042621815476966}, "ground_truth": 0}, {"key": "37349129", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.000771112716411618, "res": {"No": 0.999220934329368, "Yes": 0.000771112716411618}, "ground_truth": 0}, {"key": "37349129", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.010480614146929605, "res": {"No": 0.9895184899099019, "Yes": 0.010480614146929605}, "ground_truth": 0}, {"key": "37349129", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0010046088672900461, "res": {"No": 0.9989925882802444, "Yes": 0.0010046088672900461}, "ground_truth": 1}, {"key": "37349129", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.011592487731648182, "res": {"No": 0.9883980467927468, "Yes": 0.011592487731648182}, "ground_truth": 0}, {"key": "37349129", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.11519902434311546, "res": {"No": 0.8847930262232891, "Yes": 0.11519902434311546}, "ground_truth": 0}, {"key": "37160199", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9817115274675496, "res": {"Yes": 0.9817115274675496, "No": 0.018287527662349843}, "ground_truth": 0}, {"key": "37160199", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999407942934993, "res": {"Yes": 0.999407942934993, "No": 0.000591936613857176}, "ground_truth": 0}, {"key": "37160199", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9581026398808158, "res": {"Yes": 0.9581026398808158, "No": 0.04189423713740852}, "ground_truth": 1}, {"key": "37160199", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9951289940152396, "res": {"Yes": 0.9951289940152396, "No": 0.0048703523177363135}, "ground_truth": 0}, {"key": "37160199", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.998162890754771, "res": {"Yes": 0.998162890754771, "No": 0.001836060931946189}, "ground_truth": 0}, {"key": "35891053", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.004444890698866177, "res": {"No": 0.995554984454658, "Yes": 0.004444890698866177}, "ground_truth": 0}, {"key": "35891053", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9218744371530342, "res": {"Yes": 0.9218744371530342, "No": 0.07812420085764754}, "ground_truth": 0}, {"key": "35891053", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980825993657071, "res": {"Yes": 0.9980825993657071, "No": 0.0019170749847655156}, "ground_truth": 1}, {"key": "35891053", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9929706039977225, "res": {"Yes": 0.9929706039977225, "No": 0.0070288898619743365}, "ground_truth": 0}, {"key": "35891053", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998671488654937, "res": {"Yes": 0.9998671488654937, "No": 0.00013274042878361225}, "ground_truth": 0}, {"key": "40694542", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9861666208429524, "res": {"Yes": 0.9861666208429524, "No": 0.013831877319019126}, "ground_truth": 0}, {"key": "40694542", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8329548583003374, "res": {"Yes": 0.8329548583003374, "No": 0.16702653282395227}, "ground_truth": 0}, {"key": "40694542", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.991610059655631, "res": {"Yes": 0.991610059655631, "No": 0.0083882740064007}, "ground_truth": 1}, {"key": "40694542", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9949822790322338, "res": {"Yes": 0.9949822790322338, "No": 0.005017032778576347}, "ground_truth": 0}, {"key": "40694542", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9582426135705695, "res": {"Yes": 0.9582426135705695, "No": 0.04175436843438573}, "ground_truth": 0}, {"key": "24645770", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9500356345864845, "res": {"Yes": 0.9500356345864845, "No": 0.04996412655290036}, "ground_truth": 0}, {"key": "24645770", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9935738363753823, "res": {"Yes": 0.9935738363753823, "No": 0.006426010399130124}, "ground_truth": 0}, {"key": "24645770", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9931770563002911, "res": {"Yes": 0.9931770563002911, "No": 0.006822843217099956}, "ground_truth": 1}, {"key": "24645770", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9971340950687264, "res": {"Yes": 0.9971340950687264, "No": 0.0028657619873689276}, "ground_truth": 0}, {"key": "24645770", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9898979875911516, "res": {"Yes": 0.9898979875911516, "No": 0.010101721743598578}, "ground_truth": 0}, {"key": "37974587", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.998528718796974, "res": {"Yes": 0.998528718796974, "No": 0.0014699740961697301}, "ground_truth": 0}, {"key": "37974587", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996061047471125, "res": {"Yes": 0.9996061047471125, "No": 0.00039282254009358647}, "ground_truth": 0}, {"key": "37974587", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9765687760136395, "res": {"Yes": 0.9765687760136395, "No": 0.02343004045104972}, "ground_truth": 1}, {"key": "37974587", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3627561984412283, "res": {"No": 0.6372352259926005, "Yes": 0.3627561984412283}, "ground_truth": 0}, {"key": "37974587", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.010485303174260302, "res": {"No": 0.9895119531723484, "Yes": 0.010485303174260302}, "ground_truth": 0}, {"key": "40354149", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.008052066600014804, "res": {"No": 0.9919461286185041, "Yes": 0.008052066600014804}, "ground_truth": 0}, {"key": "40354149", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.30241972760970703, "res": {"No": 0.6975605353641664, "Yes": 0.30241972760970703}, "ground_truth": 0}, {"key": "40354149", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.07230392959858485, "res": {"No": 0.9276931947173255, "Yes": 0.07230392959858485}, "ground_truth": 1}, {"key": "40354149", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.02084810963157371, "res": {"No": 0.9791508965290399, "Yes": 0.02084810963157371}, "ground_truth": 0}, {"key": "40354149", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0848008765129568, "res": {"No": 0.915197197988253, "Yes": 0.0848008765129568}, "ground_truth": 0}, {"key": "35519470", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.992964500524069, "res": {"Yes": 0.992964500524069, "No": 0.007035257404214025}, "ground_truth": 0}, {"key": "35519470", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998578522539484, "res": {"Yes": 0.9998578522539484, "No": 0.00014209566926457384}, "ground_truth": 0}, {"key": "35519470", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9923472095592571, "res": {"Yes": 0.9923472095592571, "No": 0.007651483717114079}, "ground_truth": 1}, {"key": "35519470", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996592317346991, "res": {"Yes": 0.9996592317346991, "No": 0.0003397804786180147}, "ground_truth": 0}, {"key": "35519470", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9991485651765075, "res": {"Yes": 0.9991485651765075, "No": 0.0008508230354140098}, "ground_truth": 0}, {"key": "36185624", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.011187278438020748, "res": {"No": 0.9888123385989712, "Yes": 0.011187278438020748}, "ground_truth": 0}, {"key": "36185624", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9756523819949456, "res": {"Yes": 0.9756523819949456, "No": 0.02434693281038549}, "ground_truth": 0}, {"key": "36185624", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9910422270649136, "res": {"Yes": 0.9910422270649136, "No": 0.008956184318576508}, "ground_truth": 1}, {"key": "36185624", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978220175532359, "res": {"Yes": 0.9978220175532359, "No": 0.002177462001296463}, "ground_truth": 0}, {"key": "36185624", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9938465935308269, "res": {"Yes": 0.9938465935308269, "No": 0.006152289438591663}, "ground_truth": 0}, {"key": "39306113", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5700387488645418, "res": {"Yes": 0.5700387488645418, "No": 0.42995965511945117}, "ground_truth": 0}, {"key": "39306113", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9875754737633243, "res": {"Yes": 0.9875754737633243, "No": 0.012424109246398876}, "ground_truth": 0}, {"key": "39306113", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8598036325938517, "res": {"Yes": 0.8598036325938517, "No": 0.1401937338143435}, "ground_truth": 1}, {"key": "39306113", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9801985850888787, "res": {"Yes": 0.9801985850888787, "No": 0.019799783018565546}, "ground_truth": 0}, {"key": "39306113", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9574176785769347, "res": {"Yes": 0.9574176785769347, "No": 0.04258005192705716}, "ground_truth": 0}, {"key": "19347718", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.013794169170281423, "res": {"No": 0.9862055781524357, "Yes": 0.013794169170281423}, "ground_truth": 0}, {"key": "19347718", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999362728606604, "res": {"Yes": 0.9999362728606604, "No": 6.358588793839589e-05}, "ground_truth": 0}, {"key": "19347718", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9979873836338783, "res": {"Yes": 0.9979873836338783, "No": 0.0020125755681202387}, "ground_truth": 1}, {"key": "19347718", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.04614273739375229, "res": {"No": 0.953857103920296, "Yes": 0.04614273739375229}, "ground_truth": 0}, {"key": "19347718", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994984442211723, "res": {"Yes": 0.9994984442211723, "No": 0.000501406704886006}, "ground_truth": 0}, {"key": "21870064", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9998829936457775, "res": {"Yes": 0.9998829936457775, "No": 0.00011687962487679349}, "ground_truth": 0}, {"key": "21870064", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999975250738268, "res": {"Yes": 0.999975250738268, "No": 2.4439765955392548e-05}, "ground_truth": 0}, {"key": "21870064", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999944422379444, "res": {"Yes": 0.9999944422379444, "No": 5.424802851149654e-06}, "ground_truth": 1}, {"key": "21870064", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999934886141991, "res": {"Yes": 0.9999934886141991, "No": 6.3288690680852764e-06}, "ground_truth": 0}, {"key": "21870064", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999814491960682, "res": {"Yes": 0.9999814491960682, "No": 1.8419678152677423e-05}, "ground_truth": 0}, {"key": "37675776", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.984166575708737, "res": {"Yes": 0.984166575708737, "No": 0.01583243967154037}, "ground_truth": 0}, {"key": "37675776", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9938733184250416, "res": {"Yes": 0.9938733184250416, "No": 0.006124984825645791}, "ground_truth": 0}, {"key": "37675776", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.933702279624103, "res": {"Yes": 0.933702279624103, "No": 0.06629277911594825}, "ground_truth": 1}, {"key": "37675776", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988075053874662, "res": {"Yes": 0.9988075053874662, "No": 0.0011911900852006013}, "ground_truth": 0}, {"key": "37675776", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9928790563284463, "res": {"Yes": 0.9928790563284463, "No": 0.007119477080538282}, "ground_truth": 0}, {"key": "38107017", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9977343155464535, "res": {"Yes": 0.9977343155464535, "No": 0.0022655847173671624}, "ground_truth": 0}, {"key": "38107017", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994366397470112, "res": {"Yes": 0.9994366397470112, "No": 0.0005631463595120179}, "ground_truth": 0}, {"key": "38107017", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999132028445421, "res": {"Yes": 0.999132028445421, "No": 0.0008670733349876324}, "ground_truth": 1}, {"key": "38107017", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999154137776163, "res": {"Yes": 0.9999154137776163, "No": 8.441630397154067e-05}, "ground_truth": 0}, {"key": "38107017", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9982378374348327, "res": {"Yes": 0.9982378374348327, "No": 0.0017614011124881118}, "ground_truth": 0}, {"key": "40046472", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9173935753043073, "res": {"Yes": 0.9173935753043073, "No": 0.08259330954337224}, "ground_truth": 0}, {"key": "40046472", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.966403059435496, "res": {"Yes": 0.966403059435496, "No": 0.03351961798708073}, "ground_truth": 0}, {"key": "40046472", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9573097358190625, "res": {"Yes": 0.9573097358190625, "No": 0.04226084803123261}, "ground_truth": 1}, {"key": "40046472", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9980816475945942, "res": {"Yes": 0.9980816475945942, "No": 0.0019145445835704459}, "ground_truth": 0}, {"key": "40046472", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8031027624982695, "res": {"Yes": 0.8031027624982695, "No": 0.19682906839739842}, "ground_truth": 0}, {"key": "32157820", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9006197874032429, "res": {"Yes": 0.9006197874032429, "No": 0.0993784986585959}, "ground_truth": 0}, {"key": "32157820", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9929379354050706, "res": {"Yes": 0.9929379354050706, "No": 0.007061768945563007}, "ground_truth": 0}, {"key": "32157820", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8525123952904691, "res": {"Yes": 0.8525123952904691, "No": 0.14748582640336327}, "ground_truth": 1}, {"key": "32157820", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9923338301297304, "res": {"Yes": 0.9923338301297304, "No": 0.0076658720710416905}, "ground_truth": 0}, {"key": "32157820", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9011211217982898, "res": {"Yes": 0.9011211217982898, "No": 0.09887630050097844}, "ground_truth": 0}, {"key": "41004037", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0021309386832018876, "res": {"No": 0.9978687834738286, "Yes": 0.0021309386832018876}, "ground_truth": 0}, {"key": "41004037", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993147247384162, "res": {"Yes": 0.9993147247384162, "No": 0.0006843534732951589}, "ground_truth": 0}, {"key": "41004037", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9962034674225453, "res": {"Yes": 0.9962034674225453, "No": 0.00379627559290165}, "ground_truth": 1}, {"key": "41004037", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9976323908184244, "res": {"Yes": 0.9976323908184244, "No": 0.00236711586381749}, "ground_truth": 0}, {"key": "41004037", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9955331246965261, "res": {"Yes": 0.9955331246965261, "No": 0.004465783071838213}, "ground_truth": 0}, {"key": "21387993", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9709218315203487, "res": {"Yes": 0.9709218315203487, "No": 0.029077930342946513}, "ground_truth": 0}, {"key": "21387993", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991409572886376, "res": {"Yes": 0.9991409572886376, "No": 0.0008588974724260097}, "ground_truth": 0}, {"key": "21387993", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999377109936612, "res": {"Yes": 0.999377109936612, "No": 0.0006226674312044153}, "ground_truth": 1}, {"key": "21387993", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994006794643402, "res": {"Yes": 0.9994006794643402, "No": 0.0005992002551162041}, "ground_truth": 0}, {"key": "21387993", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990844371436729, "res": {"Yes": 0.9990844371436729, "No": 0.0009154889168864957}, "ground_truth": 0}, {"key": "34665539", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4531133971457859, "res": {"No": 0.5468802619856125, "Yes": 0.4531133971457859}, "ground_truth": 0}, {"key": "34665539", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7666198214932056, "res": {"Yes": 0.7666198214932056, "No": 0.23337457458582617}, "ground_truth": 0}, {"key": "34665539", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9898510249749587, "res": {"Yes": 0.9898510249749587, "No": 0.010147857292166721}, "ground_truth": 1}, {"key": "34665539", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9764928390250234, "res": {"Yes": 0.9764928390250234, "No": 0.02350681264635431}, "ground_truth": 0}, {"key": "34665539", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.948897456953708, "res": {"Yes": 0.948897456953708, "No": 0.051100775794462594}, "ground_truth": 0}, {"key": "37872111", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7053672287097664, "res": {"Yes": 0.7053672287097664, "No": 0.2946145462204392}, "ground_truth": 0}, {"key": "37872111", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.46228046730748334, "res": {"No": 0.5377173116197033, "Yes": 0.46228046730748334}, "ground_truth": 0}, {"key": "37872111", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.33692824302887814, "res": {"No": 0.6630693791517422, "Yes": 0.33692824302887814}, "ground_truth": 1}, {"key": "37872111", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.855015749283848, "res": {"Yes": 0.855015749283848, "No": 0.14497880785022305}, "ground_truth": 0}, {"key": "37872111", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.1478701729483712, "res": {"No": 0.8521229713477352, "Yes": 0.1478701729483712}, "ground_truth": 0}, {"key": "36629542", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9761085514555273, "res": {"Yes": 0.9761085514555273, "No": 0.02388718634522787}, "ground_truth": 0}, {"key": "36629542", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999390676113243, "res": {"Yes": 0.999390676113243, "No": 0.0006089112692295414}, "ground_truth": 0}, {"key": "36629542", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9985000699212302, "res": {"Yes": 0.9985000699212302, "No": 0.0014983006696131574}, "ground_truth": 1}, {"key": "36629542", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997419123103592, "res": {"Yes": 0.9997419123103592, "No": 0.00025786664152293985}, "ground_truth": 0}, {"key": "36629542", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984386238181024, "res": {"Yes": 0.9984386238181024, "No": 0.0015608645695328737}, "ground_truth": 0}, {"key": "36487527", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9969262506700372, "res": {"Yes": 0.9969262506700372, "No": 0.003073088183562478}, "ground_truth": 0}, {"key": "36487527", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995727597931009, "res": {"Yes": 0.9995727597931009, "No": 0.00042652725039589727}, "ground_truth": 0}, {"key": "36487527", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999711531015181, "res": {"Yes": 0.999711531015181, "No": 0.00028732344233191553}, "ground_truth": 1}, {"key": "36487527", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993068663681752, "res": {"Yes": 0.9993068663681752, "No": 0.0006914412297408871}, "ground_truth": 0}, {"key": "36487527", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.989957921294243, "res": {"Yes": 0.989957921294243, "No": 0.010040057877941103}, "ground_truth": 0}, {"key": "37344756", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.810642464221325, "res": {"Yes": 0.810642464221325, "No": 0.18935697287289696}, "ground_truth": 0}, {"key": "37344756", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6766893459458062, "res": {"Yes": 0.6766893459458062, "No": 0.32330966495573}, "ground_truth": 0}, {"key": "37344756", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997783688938031, "res": {"Yes": 0.9997783688938031, "No": 0.00022113006503322972}, "ground_truth": 1}, {"key": "37344756", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9162120550078304, "res": {"Yes": 0.9162120550078304, "No": 0.0837865320335776}, "ground_truth": 0}, {"key": "37344756", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.31174070824952943, "res": {"No": 0.6882581454590215, "Yes": 0.31174070824952943}, "ground_truth": 0}, {"key": "38707722", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.999132981228169, "res": {"Yes": 0.999132981228169, "No": 0.0008656992466184497}, "ground_truth": 0}, {"key": "38707722", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999120763555102, "res": {"Yes": 0.9999120763555102, "No": 8.738018650765218e-05}, "ground_truth": 0}, {"key": "38707722", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9887653770609663, "res": {"Yes": 0.9887653770609663, "No": 0.011233312330298985}, "ground_truth": 1}, {"key": "38707722", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9961900999560035, "res": {"Yes": 0.9961900999560035, "No": 0.0038094113617803014}, "ground_truth": 0}, {"key": "38707722", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.996685792948813, "res": {"Yes": 0.996685792948813, "No": 0.003313898460521911}, "ground_truth": 0}, {"key": "37093419", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9941988967583119, "res": {"Yes": 0.9941988967583119, "No": 0.005800698138306246}, "ground_truth": 0}, {"key": "37093419", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.997317850906571, "res": {"Yes": 0.997317850906571, "No": 0.0026819600227348966}, "ground_truth": 1}, {"key": "37093419", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.597844052986382, "res": {"Yes": 0.597844052986382, "No": 0.4021536055450955}, "ground_truth": 0}, {"key": "37093419", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7853732629558534, "res": {"Yes": 0.7853732629558534, "No": 0.2146231026728417}, "ground_truth": 0}, {"key": "35547391", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9841770787904773, "res": {"Yes": 0.9841770787904773, "No": 0.015822172498443077}, "ground_truth": 0}, {"key": "35547391", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7681169183396391, "res": {"Yes": 0.7681169183396391, "No": 0.23187790903398675}, "ground_truth": 0}, {"key": "35547391", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.995144798182341, "res": {"Yes": 0.995144798182341, "No": 0.004853441199291201}, "ground_truth": 1}, {"key": "35547391", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996562526646581, "res": {"Yes": 0.9996562526646581, "No": 0.00034309952243939765}, "ground_truth": 0}, {"key": "35547391", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9979806137096249, "res": {"Yes": 0.9979806137096249, "No": 0.002018951422740646}, "ground_truth": 0}, {"key": "37173168", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.003700930516516873, "res": {"No": 0.996287232927033, "Yes": 0.003700930516516873}, "ground_truth": 0}, {"key": "37173168", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.43799823425285184, "res": {"No": 0.561856185231814, "Yes": 0.43799823425285184}, "ground_truth": 0}, {"key": "37173168", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3441012959445318, "res": {"No": 0.6558578799020935, "Yes": 0.3441012959445318}, "ground_truth": 1}, {"key": "37173168", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.532531887799465, "res": {"Yes": 0.532531887799465, "No": 0.4674581280187217}, "ground_truth": 0}, {"key": "37173168", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.23551419295896278, "res": {"No": 0.7644280284751365, "Yes": 0.23551419295896278}, "ground_truth": 0}, {"key": "30725298", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999293595151566, "res": {"Yes": 0.9999293595151566, "No": 7.052756017986836e-05}, "ground_truth": 0}, {"key": "30725298", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999506956924973, "res": {"Yes": 0.9999506956924973, "No": 4.916212735980677e-05}, "ground_truth": 0}, {"key": "30725298", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999772771531678, "res": {"Yes": 0.9999772771531678, "No": 2.1542237825761754e-05}, "ground_truth": 1}, {"key": "30725298", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998768031293578, "res": {"Yes": 0.9998768031293578, "No": 0.00012196163864656939}, "ground_truth": 0}, {"key": "30725298", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998808482291361, "res": {"Yes": 0.9998808482291361, "No": 0.0001190288092041839}, "ground_truth": 0}, {"key": "33830573", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.02170221391298324, "res": {"No": 0.9782969687604931, "Yes": 0.02170221391298324}, "ground_truth": 0}, {"key": "33830573", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8806717768096902, "res": {"Yes": 0.8806717768096902, "No": 0.1193242740396687}, "ground_truth": 0}, {"key": "33830573", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.06913062141408867, "res": {"No": 0.9308687305326795, "Yes": 0.06913062141408867}, "ground_truth": 1}, {"key": "33830573", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9069844259160821, "res": {"Yes": 0.9069844259160821, "No": 0.09301337304348999}, "ground_truth": 0}, {"key": "33830573", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5775135059114518, "res": {"Yes": 0.5775135059114518, "No": 0.42247922710880687}, "ground_truth": 0}, {"key": "33415474", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8454339188465448, "res": {"Yes": 0.8454339188465448, "No": 0.15456519461982238}, "ground_truth": 0}, {"key": "33415474", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9954801985848725, "res": {"Yes": 0.9954801985848725, "No": 0.004519684899807457}, "ground_truth": 0}, {"key": "33415474", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991263189817056, "res": {"Yes": 0.9991263189817056, "No": 0.0008730859092815972}, "ground_truth": 1}, {"key": "33415474", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8052923256730352, "res": {"Yes": 0.8052923256730352, "No": 0.19470501682242844}, "ground_truth": 0}, {"key": "33415474", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9870331642986891, "res": {"Yes": 0.9870331642986891, "No": 0.012965240632522985}, "ground_truth": 0}, {"key": "37383994", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9870362961598882, "res": {"Yes": 0.9870362961598882, "No": 0.012963598040595239}, "ground_truth": 0}, {"key": "37383994", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9940225425112219, "res": {"Yes": 0.9940225425112219, "No": 0.005977224196334576}, "ground_truth": 0}, {"key": "37383994", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991911790221687, "res": {"Yes": 0.9991911790221687, "No": 0.0008084740305458257}, "ground_truth": 1}, {"key": "37383994", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998016356326763, "res": {"Yes": 0.998016356326763, "No": 0.001983359212219373}, "ground_truth": 0}, {"key": "37383994", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999054015547151, "res": {"Yes": 0.9999054015547151, "No": 9.417837193843223e-05}, "ground_truth": 0}, {"key": "38576819", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9997347656408535, "res": {"Yes": 0.9997347656408535, "No": 0.00026508394726787395}, "ground_truth": 0}, {"key": "38576819", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9988871956265115, "res": {"Yes": 0.9988871956265115, "No": 0.0011126641547250338}, "ground_truth": 0}, {"key": "38576819", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9913668891765915, "res": {"Yes": 0.9913668891765915, "No": 0.008631983176475446}, "ground_truth": 1}, {"key": "38576819", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9976587295590928, "res": {"Yes": 0.9976587295590928, "No": 0.0023408047464412605}, "ground_truth": 0}, {"key": "38576819", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999447358231209, "res": {"Yes": 0.9999447358231209, "No": 5.4947630448541e-05}, "ground_truth": 0}, {"key": "34500226", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999087389545426, "res": {"Yes": 0.9999087389545426, "No": 9.109077692882955e-05}, "ground_truth": 0}, {"key": "34500226", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994767712319385, "res": {"Yes": 0.9994767712319385, "No": 0.0005229467058249076}, "ground_truth": 0}, {"key": "34500226", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990141206986459, "res": {"Yes": 0.9990141206986459, "No": 0.0009855371849681281}, "ground_truth": 1}, {"key": "34500226", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9973103758378286, "res": {"Yes": 0.9973103758378286, "No": 0.0026893157116911364}, "ground_truth": 0}, {"key": "34500226", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999343776239055, "res": {"Yes": 0.999343776239055, "No": 0.0006558997505380485}, "ground_truth": 0}, {"key": "39856394", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.004951857600353878, "res": {"No": 0.9950477749013452, "Yes": 0.004951857600353878}, "ground_truth": 0}, {"key": "39856394", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994723667474078, "res": {"Yes": 0.9994723667474078, "No": 0.0005268187481421274}, "ground_truth": 0}, {"key": "39856394", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9989967524896284, "res": {"Yes": 0.9989967524896284, "No": 0.0010028593591736078}, "ground_truth": 1}, {"key": "39856394", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995703767345164, "res": {"Yes": 0.9995703767345164, "No": 0.00042904103110861093}, "ground_truth": 0}, {"key": "39856394", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9961263297921261, "res": {"Yes": 0.9961263297921261, "No": 0.003872387643649642}, "ground_truth": 0}, {"key": "35499522", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 1.2165847622531867e-06, "res": {"No": 0.9999980183344636, "Yes": 1.2165847622531867e-06}, "ground_truth": 0}, {"key": "35499522", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9836538571548261, "res": {"Yes": 0.9836538571548261, "No": 0.016345698580711606}, "ground_truth": 0}, {"key": "35499522", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997893295841292, "res": {"Yes": 0.9997893295841292, "No": 0.00021036551344863637}, "ground_truth": 1}, {"key": "35499522", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990427841936136, "res": {"Yes": 0.9990427841936136, "No": 0.0009562750280900255}, "ground_truth": 0}, {"key": "35499522", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996809123193061, "res": {"Yes": 0.9996809123193061, "No": 0.00031893571368074304}, "ground_truth": 0}, {"key": "30157766", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9627809425959074, "res": {"Yes": 0.9627809425959074, "No": 0.037215616775642286}, "ground_truth": 0}, {"key": "30157766", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7892514139773971, "res": {"Yes": 0.7892514139773971, "No": 0.2107461184633563}, "ground_truth": 0}, {"key": "30157766", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9751228489484501, "res": {"Yes": 0.9751228489484501, "No": 0.024875925266152794}, "ground_truth": 1}, {"key": "30157766", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9829845157437316, "res": {"Yes": 0.9829845157437316, "No": 0.017012639690288444}, "ground_truth": 0}, {"key": "30157766", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5799338695264904, "res": {"Yes": 0.5799338695264904, "No": 0.4200596432704872}, "ground_truth": 0}, {"key": "40472346", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.16848239758795308, "res": {"No": 0.8315137035232413, "Yes": 0.16848239758795308}, "ground_truth": 0}, {"key": "40472346", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.727651415733809, "res": {"Yes": 0.727651415733809, "No": 0.2723425581794445}, "ground_truth": 0}, {"key": "40472346", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9798399960344629, "res": {"Yes": 0.9798399960344629, "No": 0.020158519015704365}, "ground_truth": 1}, {"key": "40472346", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3868606609540412, "res": {"No": 0.6131286595471225, "Yes": 0.3868606609540412}, "ground_truth": 0}, {"key": "40472346", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.05665896792368945, "res": {"No": 0.9433379660669379, "Yes": 0.05665896792368945}, "ground_truth": 0}, {"key": "35305635", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.006685078672405648, "res": {"No": 0.9933087696468418, "Yes": 0.006685078672405648}, "ground_truth": 0}, {"key": "35305635", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.02457052316104281, "res": {"No": 0.9754270674389677, "Yes": 0.02457052316104281}, "ground_truth": 0}, {"key": "35305635", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.19278920288647663, "res": {"No": 0.8072018322998576, "Yes": 0.19278920288647663}, "ground_truth": 1}, {"key": "35305635", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.06476963377767951, "res": {"No": 0.9352199001681905, "Yes": 0.06476963377767951}, "ground_truth": 0}, {"key": "35305635", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0018809458818940898, "res": {"No": 0.99811871004853, "Yes": 0.0018809458818940898}, "ground_truth": 0}, {"key": "32495926", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9109335465427669, "res": {"Yes": 0.9109335465427669, "No": 0.08906498563717342}, "ground_truth": 0}, {"key": "32495926", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997097471315166, "res": {"Yes": 0.9997097471315166, "No": 0.0002900452826803022}, "ground_truth": 0}, {"key": "32495926", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9975609746676114, "res": {"Yes": 0.9975609746676114, "No": 0.0024387028497290333}, "ground_truth": 1}, {"key": "32495926", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9948237959532116, "res": {"Yes": 0.9948237959532116, "No": 0.005176156947931049}, "ground_truth": 0}, {"key": "32495926", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9936579989224894, "res": {"Yes": 0.9936579989224894, "No": 0.006341273900744991}, "ground_truth": 0}, {"key": "37353801", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9979030910917147, "res": {"Yes": 0.9979030910917147, "No": 0.002096165616791738}, "ground_truth": 0}, {"key": "37353801", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9987178506567236, "res": {"Yes": 0.9987178506567236, "No": 0.0012815455096412986}, "ground_truth": 0}, {"key": "37353801", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991911790221687, "res": {"Yes": 0.9991911790221687, "No": 0.0008080517940100546}, "ground_truth": 1}, {"key": "37353801", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999754187196919, "res": {"Yes": 0.999754187196919, "No": 0.00024531781107006213}, "ground_truth": 0}, {"key": "37353801", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999776347571058, "res": {"Yes": 0.9999776347571058, "No": 2.1958263940078065e-05}, "ground_truth": 0}, {"key": "30159904", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.2742627473887451, "res": {"No": 0.7257353008645295, "Yes": 0.2742627473887451}, "ground_truth": 0}, {"key": "30159904", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.4380553967521938, "res": {"No": 0.5619402508240564, "Yes": 0.4380553967521938}, "ground_truth": 0}, {"key": "30159904", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.014068106415965287, "res": {"No": 0.9859232255153506, "Yes": 0.014068106415965287}, "ground_truth": 1}, {"key": "30159904", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.25560144580005945, "res": {"No": 0.7443681509422807, "Yes": 0.25560144580005945}, "ground_truth": 0}, {"key": "30159904", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.08464333580195157, "res": {"No": 0.915349389631197, "Yes": 0.08464333580195157}, "ground_truth": 0}, {"key": "33698679", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996643557411417, "res": {"Yes": 0.9996643557411417, "No": 0.00033524397755687767}, "ground_truth": 0}, {"key": "33698679", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996913989471037, "res": {"Yes": 0.9996913989471037, "No": 0.00030816906908333504}, "ground_truth": 0}, {"key": "33698679", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999100500717374, "res": {"Yes": 0.9999100500717374, "No": 8.953615927763537e-05}, "ground_truth": 1}, {"key": "33698679", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999783493530909, "res": {"Yes": 0.999783493530909, "No": 0.0002162963715990714}, "ground_truth": 0}, {"key": "33698679", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996548227073943, "res": {"Yes": 0.9996548227073943, "No": 0.00034482966068712464}, "ground_truth": 0}, {"key": "40530172", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0037431323176127036, "res": {"No": 0.9962506713508971, "Yes": 0.0037431323176127036}, "ground_truth": 0}, {"key": "40530172", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.018946866828293742, "res": {"No": 0.9810522734055218, "Yes": 0.018946866828293742}, "ground_truth": 0}, {"key": "40530172", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9014167019479785, "res": {"Yes": 0.9014167019479785, "No": 0.09858288623840057}, "ground_truth": 1}, {"key": "40530172", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5300459913864274, "res": {"Yes": 0.5300459913864274, "No": 0.46995313594725563}, "ground_truth": 0}, {"key": "40530172", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9917669308916173, "res": {"Yes": 0.9917669308916173, "No": 0.008232636197250091}, "ground_truth": 0}, {"key": "40652941", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.000567002412157239, "res": {"No": 0.9994323545216897, "Yes": 0.000567002412157239}, "ground_truth": 0}, {"key": "40652941", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9952907471670075, "res": {"Yes": 0.9952907471670075, "No": 0.004708918571360912}, "ground_truth": 0}, {"key": "40652941", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7553423037723203, "res": {"Yes": 0.7553423037723203, "No": 0.244646320796745}, "ground_truth": 1}, {"key": "40652941", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9814831804393239, "res": {"Yes": 0.9814831804393239, "No": 0.018510937599609124}, "ground_truth": 0}, {"key": "40652941", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.998628795361346, "res": {"Yes": 0.998628795361346, "No": 0.0013701783022264796}, "ground_truth": 0}, {"key": "40122246", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7305512009258641, "res": {"Yes": 0.7305512009258641, "No": 0.2694456173243221}, "ground_truth": 0}, {"key": "40122246", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.842978875511058, "res": {"Yes": 0.842978875511058, "No": 0.15701882128857672}, "ground_truth": 0}, {"key": "40122246", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4145510008989817, "res": {"No": 0.5854430312471159, "Yes": 0.4145510008989817}, "ground_truth": 1}, {"key": "40122246", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.978902150366433, "res": {"Yes": 0.978902150366433, "No": 0.02109638669177158}, "ground_truth": 0}, {"key": "40122246", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6142453855138692, "res": {"Yes": 0.6142453855138692, "No": 0.3857539685156814}, "ground_truth": 0}, {"key": "40032656", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.15378517776413014, "res": {"No": 0.8462106120036398, "Yes": 0.15378517776413014}, "ground_truth": 0}, {"key": "40032656", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.03261814338080418, "res": {"No": 0.9673746434174314, "Yes": 0.03261814338080418}, "ground_truth": 0}, {"key": "40032656", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1703798879526017, "res": {"No": 0.8296152499027953, "Yes": 0.1703798879526017}, "ground_truth": 1}, {"key": "40032656", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6334203608927178, "res": {"Yes": 0.6334203608927178, "No": 0.36653407056425075}, "ground_truth": 0}, {"key": "40032656", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.985584991597433, "res": {"Yes": 0.985584991597433, "No": 0.014405632543857063}, "ground_truth": 0}, {"key": "38913680", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9377465959925648, "res": {"Yes": 0.9377465959925648, "No": 0.06221836908041215}, "ground_truth": 0}, {"key": "38913680", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.0037479434603696067, "res": {"No": 0.9962421504553446, "Yes": 0.0037479434603696067}, "ground_truth": 0}, {"key": "38913680", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.4109997066524965e-05, "res": {"No": 0.999975489140396, "Yes": 1.4109997066524965e-05}, "ground_truth": 1}, {"key": "38913680", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.004402950476252633, "res": {"No": 0.9955916169724829, "Yes": 0.004402950476252633}, "ground_truth": 0}, {"key": "38913680", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0012552322045089766, "res": {"No": 0.9987385401102727, "Yes": 0.0012552322045089766}, "ground_truth": 0}, {"key": "17608039", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9521879911404472, "res": {"Yes": 0.9521879911404472, "No": 0.04781145613998685}, "ground_truth": 0}, {"key": "17608039", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8800247912779009, "res": {"Yes": 0.8800247912779009, "No": 0.1199679566230144}, "ground_truth": 0}, {"key": "17608039", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6724312656106977, "res": {"Yes": 0.6724312656106977, "No": 0.32756561265115886}, "ground_truth": 1}, {"key": "17608039", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.848959072964, "res": {"Yes": 0.848959072964, "No": 0.15103699079736724}, "ground_truth": 0}, {"key": "17608039", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9651515068978366, "res": {"Yes": 0.9651515068978366, "No": 0.03484747492236223}, "ground_truth": 0}, {"key": "40434901", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 9.390931268910062e-05, "res": {"No": 0.9999059975285092, "Yes": 9.390931268910062e-05}, "ground_truth": 0}, {"key": "40434901", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.0022532530656112484, "res": {"No": 0.9977465438531599, "Yes": 0.0022532530656112484}, "ground_truth": 0}, {"key": "40434901", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9619704346507346, "res": {"Yes": 0.9619704346507346, "No": 0.03802848860533992}, "ground_truth": 1}, {"key": "40434901", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8434454669541038, "res": {"Yes": 0.8434454669541038, "No": 0.15655291674305316}, "ground_truth": 0}, {"key": "40434901", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.977574941074929, "res": {"Yes": 0.977574941074929, "No": 0.022423120214302285}, "ground_truth": 0}, {"key": "37680058", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.998314578620528, "res": {"Yes": 0.998314578620528, "No": 0.0016846955735780583}, "ground_truth": 0}, {"key": "37680058", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9988975438517942, "res": {"Yes": 0.9988975438517942, "No": 0.0011023375593022685}, "ground_truth": 0}, {"key": "37680058", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998651226767641, "res": {"Yes": 0.9998651226767641, "No": 0.00013459100104627574}, "ground_truth": 1}, {"key": "37680058", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994474775967512, "res": {"Yes": 0.9994474775967512, "No": 0.0005521548641709123}, "ground_truth": 0}, {"key": "37680058", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9923442744982559, "res": {"Yes": 0.9923442744982559, "No": 0.007653359325619576}, "ground_truth": 0}, {"key": "37291821", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.008331298105086765, "res": {"No": 0.9916683214329762, "Yes": 0.008331298105086765}, "ground_truth": 0}, {"key": "37291821", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992869880139392, "res": {"Yes": 0.9992869880139392, "No": 0.0007123069712999437}, "ground_truth": 0}, {"key": "37291821", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994535499582378, "res": {"Yes": 0.9994535499582378, "No": 0.000545423773169393}, "ground_truth": 1}, {"key": "37291821", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999075470290394, "res": {"Yes": 0.9999075470290394, "No": 9.18629284577383e-05}, "ground_truth": 0}, {"key": "37291821", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9955942170629449, "res": {"Yes": 0.9955942170629449, "No": 0.004404978061366176}, "ground_truth": 0}, {"key": "41002743", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9995754929286346, "res": {"Yes": 0.9995754929286346, "No": 0.0004242922802524962}, "ground_truth": 0}, {"key": "41002743", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995208251609505, "res": {"Yes": 0.9995208251609505, "No": 0.0004786298571909879}, "ground_truth": 0}, {"key": "41002743", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998828744557322, "res": {"Yes": 0.9998828744557322, "No": 0.00011681804554206332}, "ground_truth": 1}, {"key": "41002743", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999947998470209, "res": {"Yes": 0.9999947998470209, "No": 4.946303638646456e-06}, "ground_truth": 0}, {"key": "41002743", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999975415208221, "res": {"Yes": 0.9999975415208221, "No": 2.1341779938734684e-06}, "ground_truth": 0}, {"key": "36322869", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7320599496099981, "res": {"Yes": 0.7320599496099981, "No": 0.2679397599615832}, "ground_truth": 0}, {"key": "36322869", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.998903720953415, "res": {"Yes": 0.998903720953415, "No": 0.0010939203323316233}, "ground_truth": 0}, {"key": "36322869", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8574442385384062, "res": {"Yes": 0.8574442385384062, "No": 0.14255127777025037}, "ground_truth": 1}, {"key": "36322869", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9970274395327277, "res": {"Yes": 0.9970274395327277, "No": 0.0029716913801453634}, "ground_truth": 0}, {"key": "36322869", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.992466613080703, "res": {"Yes": 0.992466613080703, "No": 0.007532417044731626}, "ground_truth": 0}, {"key": "39459717", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6084130129615783, "res": {"Yes": 0.6084130129615783, "No": 0.39158068219286996}, "ground_truth": 0}, {"key": "39459717", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8556976139336168, "res": {"Yes": 0.8556976139336168, "No": 0.14429516793599922}, "ground_truth": 0}, {"key": "39459717", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9649085991844681, "res": {"Yes": 0.9649085991844681, "No": 0.03508959258595546}, "ground_truth": 1}, {"key": "39459717", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8650115323003473, "res": {"Yes": 0.8650115323003473, "No": 0.13498565033609478}, "ground_truth": 0}, {"key": "39459717", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 1.6906085586023123e-06, "res": {"No": 0.9999981375378344, "Yes": 1.6906085586023123e-06}, "ground_truth": 0}, {"key": "36503727", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996580401016186, "res": {"Yes": 0.9996580401016186, "No": 0.0003413990261933718}, "ground_truth": 0}, {"key": "36503727", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998745385409472, "res": {"Yes": 0.9998745385409472, "No": 0.00012487547714773177}, "ground_truth": 0}, {"key": "36503727", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999437822452772, "res": {"Yes": 0.9999437822452772, "No": 5.555055782915904e-05}, "ground_truth": 1}, {"key": "36503727", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998244842046997, "res": {"Yes": 0.9998244842046997, "No": 0.00017485963353081207}, "ground_truth": 0}, {"key": "36503727", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995235655809392, "res": {"Yes": 0.9995235655809392, "No": 0.00047479045435057246}, "ground_truth": 0}, {"key": "35682367", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.999204865387198, "res": {"Yes": 0.999204865387198, "No": 0.0007950862171061538}, "ground_truth": 0}, {"key": "35682367", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998869269092439, "res": {"Yes": 0.9998869269092439, "No": 0.0001127305612736774}, "ground_truth": 0}, {"key": "35682367", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9693762893193691, "res": {"Yes": 0.9693762893193691, "No": 0.030622844385708264}, "ground_truth": 1}, {"key": "35682367", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997563213444676, "res": {"Yes": 0.9997563213444676, "No": 0.00024303988312617775}, "ground_truth": 0}, {"key": "35682367", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999084675265486, "res": {"Yes": 0.999084675265486, "No": 0.0009150459274628107}, "ground_truth": 0}, {"key": "36472353", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7973744549305979, "res": {"Yes": 0.7973744549305979, "No": 0.2026124374218916}, "ground_truth": 0}, {"key": "36472353", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9184627136311475, "res": {"Yes": 0.9184627136311475, "No": 0.08153251347063843}, "ground_truth": 0}, {"key": "36472353", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.992489500815669, "res": {"Yes": 0.992489500815669, "No": 0.007464966019330034}, "ground_truth": 1}, {"key": "36472353", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998234115535755, "res": {"Yes": 0.9998234115535755, "No": 0.0001757039643236266}, "ground_truth": 0}, {"key": "36472353", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7580188693864022, "res": {"Yes": 0.7580188693864022, "No": 0.2418498499836706}, "ground_truth": 0}, {"key": "37651907", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9973779660517363, "res": {"Yes": 0.9973779660517363, "No": 0.002621509453019391}, "ground_truth": 0}, {"key": "37651907", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9971090925438996, "res": {"Yes": 0.9971090925438996, "No": 0.00289047046340827}, "ground_truth": 0}, {"key": "37651907", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996245705712715, "res": {"Yes": 0.9996245705712715, "No": 0.00037488809119912787}, "ground_truth": 1}, {"key": "37651907", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988128560136041, "res": {"Yes": 0.9988128560136041, "No": 0.0011869147329646025}, "ground_truth": 0}, {"key": "37651907", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9975033272846225, "res": {"Yes": 0.9975033272846225, "No": 0.0024959621321607468}, "ground_truth": 0}, {"key": "36255476", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9320281172765038, "res": {"Yes": 0.9320281172765038, "No": 0.06797148499919721}, "ground_truth": 0}, {"key": "36255476", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8230436434522292, "res": {"Yes": 0.8230436434522292, "No": 0.17693486650131485}, "ground_truth": 0}, {"key": "36255476", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6453134378931484, "res": {"Yes": 0.6453134378931484, "No": 0.3546806400101144}, "ground_truth": 1}, {"key": "36255476", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9974416516654202, "res": {"Yes": 0.9974416516654202, "No": 0.0025575385165942273}, "ground_truth": 0}, {"key": "36255476", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990720550074856, "res": {"Yes": 0.9990720550074856, "No": 0.0009278569367939079}, "ground_truth": 0}, {"key": "37283518", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.01288368753474892, "res": {"No": 0.9871157429474311, "Yes": 0.01288368753474892}, "ground_truth": 0}, {"key": "37283518", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999264988413425, "res": {"Yes": 0.9999264988413425, "No": 7.32375712669602e-05}, "ground_truth": 0}, {"key": "37283518", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999249493064443, "res": {"Yes": 0.9999249493064443, "No": 7.443531982073217e-05}, "ground_truth": 1}, {"key": "37283518", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999844292352256, "res": {"Yes": 0.9999844292352256, "No": 1.504901526209695e-05}, "ground_truth": 0}, {"key": "37283518", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999980257181892, "res": {"Yes": 0.999980257181892, "No": 1.9636882496395963e-05}, "ground_truth": 0}, {"key": "34906785", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9947273037197286, "res": {"Yes": 0.9947273037197286, "No": 0.0052721201069224595}, "ground_truth": 0}, {"key": "34906785", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997702648631589, "res": {"Yes": 0.9997702648631589, "No": 0.00022905440642188477}, "ground_truth": 0}, {"key": "34906785", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988850524164439, "res": {"Yes": 0.9988850524164439, "No": 0.0011144496314648995}, "ground_truth": 1}, {"key": "34906785", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989395296964828, "res": {"Yes": 0.9989395296964828, "No": 0.001059909554968504}, "ground_truth": 0}, {"key": "34906785", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9991153765602249, "res": {"Yes": 0.9991153765602249, "No": 0.0008839038219011496}, "ground_truth": 0}, {"key": "34965328", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9489985834972837, "res": {"Yes": 0.9489985834972837, "No": 0.05099949746162432}, "ground_truth": 0}, {"key": "34965328", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9967786471269394, "res": {"Yes": 0.9967786471269394, "No": 0.0032200416008198686}, "ground_truth": 0}, {"key": "34965328", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9756041596164143, "res": {"Yes": 0.9756041596164143, "No": 0.024393792128904922}, "ground_truth": 1}, {"key": "34965328", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9894169408383622, "res": {"Yes": 0.9894169408383622, "No": 0.010581285046034464}, "ground_truth": 0}, {"key": "34965328", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9882981287545504, "res": {"Yes": 0.9882981287545504, "No": 0.011697209147897602}, "ground_truth": 0}, {"key": "38788440", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.999223666542873, "res": {"Yes": 0.999223666542873, "No": 0.0007761817898082881}, "ground_truth": 0}, {"key": "38788440", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9917005610941589, "res": {"Yes": 0.9917005610941589, "No": 0.008299023680116776}, "ground_truth": 0}, {"key": "38788440", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997914747944036, "res": {"Yes": 0.9997914747944036, "No": 0.00020822611028840912}, "ground_truth": 1}, {"key": "38788440", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989246597931071, "res": {"Yes": 0.9989246597931071, "No": 0.0010747875122109599}, "ground_truth": 0}, {"key": "38788440", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985086287011107, "res": {"Yes": 0.9985086287011107, "No": 0.0014906515093431247}, "ground_truth": 0}, {"key": "35046866", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6312258667591374, "res": {"Yes": 0.6312258667591374, "No": 0.3687628774645874}, "ground_truth": 0}, {"key": "35046866", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993119885884663, "res": {"Yes": 0.9993119885884663, "No": 0.0006871011790146208}, "ground_truth": 0}, {"key": "35046866", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998441361340874, "res": {"Yes": 0.998441361340874, "No": 0.0015582038488639576}, "ground_truth": 1}, {"key": "35046866", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989596355547316, "res": {"Yes": 0.9989596355547316, "No": 0.0010399811406330095}, "ground_truth": 0}, {"key": "35046866", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.950256797269729, "res": {"Yes": 0.950256797269729, "No": 0.049741056519006656}, "ground_truth": 0}, {"key": "37629558", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999744163342675, "res": {"Yes": 0.9999744163342675, "No": 2.5431830479900992e-05}, "ground_truth": 0}, {"key": "37629558", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9981248858273426, "res": {"Yes": 0.9981248858273426, "No": 0.001874711121430395}, "ground_truth": 0}, {"key": "37629558", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998808482291361, "res": {"Yes": 0.9998808482291361, "No": 0.00011876212678128389}, "ground_truth": 1}, {"key": "37629558", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999249493064443, "res": {"Yes": 0.9999249493064443, "No": 7.464089579175123e-05}, "ground_truth": 0}, {"key": "37629558", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998660761785957, "res": {"Yes": 0.9998660761785957, "No": 0.00013382681758131504}, "ground_truth": 0}, {"key": "33859914", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9886906707489717, "res": {"Yes": 0.9886906707489717, "No": 0.011308518360997697}, "ground_truth": 0}, {"key": "33859914", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6193486361816087, "res": {"Yes": 0.6193486361816087, "No": 0.380639197774445}, "ground_truth": 0}, {"key": "33859914", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8835457286893628, "res": {"Yes": 0.8835457286893628, "No": 0.11644949724588588}, "ground_truth": 1}, {"key": "33859914", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9957984383618281, "res": {"Yes": 0.9957984383618281, "No": 0.004200385383189717}, "ground_truth": 0}, {"key": "33859914", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7740710219319981, "res": {"Yes": 0.7740710219319981, "No": 0.22591810785501024}, "ground_truth": 0}, {"key": "39790523", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9941826298090434, "res": {"Yes": 0.9941826298090434, "No": 0.005817288612108833}, "ground_truth": 0}, {"key": "39790523", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9861899247286263, "res": {"Yes": 0.9861899247286263, "No": 0.013809686676210962}, "ground_truth": 0}, {"key": "39790523", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994247334992588, "res": {"Yes": 0.9994247334992588, "No": 0.0005751785750948628}, "ground_truth": 1}, {"key": "39790523", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990667031926357, "res": {"Yes": 0.9990667031926357, "No": 0.0009332226936627523}, "ground_truth": 0}, {"key": "39790523", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9945167959421559, "res": {"Yes": 0.9945167959421559, "No": 0.005482858993090891}, "ground_truth": 0}, {"key": "33509656", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.999783255162557, "res": {"Yes": 0.999783255162557, "No": 0.0002166598382518555}, "ground_truth": 0}, {"key": "33509656", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6661769453637936, "res": {"Yes": 0.6661769453637936, "No": 0.33382292208341446}, "ground_truth": 0}, {"key": "33509656", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997203495794703, "res": {"Yes": 0.9997203495794703, "No": 0.0002795364115421991}, "ground_truth": 1}, {"key": "33509656", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999478349506435, "res": {"Yes": 0.9999478349506435, "No": 5.209023785427469e-05}, "ground_truth": 0}, {"key": "33509656", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994772477825765, "res": {"Yes": 0.9994772477825765, "No": 0.0005227213643592713}, "ground_truth": 0}, {"key": "17380923", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.03517562527571318, "res": {"No": 0.9648239254159418, "Yes": 0.03517562527571318}, "ground_truth": 0}, {"key": "17380923", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999736672396801, "res": {"Yes": 0.999736672396801, "No": 0.0002630866795626433}, "ground_truth": 0}, {"key": "17380923", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980963749968089, "res": {"Yes": 0.9980963749968089, "No": 0.0019034382936069676}, "ground_truth": 1}, {"key": "17380923", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989001598679974, "res": {"Yes": 0.9989001598679974, "No": 0.0010991824530566668}, "ground_truth": 0}, {"key": "17380923", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9938783875894422, "res": {"Yes": 0.9938783875894422, "No": 0.006120625388593688}, "ground_truth": 0}, {"key": "36202526", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9545114596204824, "res": {"Yes": 0.9545114596204824, "No": 0.045486459077955274}, "ground_truth": 0}, {"key": "36202526", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9212969255047281, "res": {"Yes": 0.9212969255047281, "No": 0.07870082820843378}, "ground_truth": 0}, {"key": "36202526", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9983605605514686, "res": {"Yes": 0.9983605605514686, "No": 0.0016391858390772548}, "ground_truth": 1}, {"key": "36202526", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.802135237515683, "res": {"Yes": 0.802135237515683, "No": 0.19786268479778088}, "ground_truth": 0}, {"key": "36202526", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9884081779246484, "res": {"Yes": 0.9884081779246484, "No": 0.011591101353022576}, "ground_truth": 0}, {"key": "26419232", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5543500292496002, "res": {"Yes": 0.5543500292496002, "No": 0.44563502124460264}, "ground_truth": 0}, {"key": "26419232", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990607522695415, "res": {"Yes": 0.9990607522695415, "No": 0.000938948148683555}, "ground_truth": 0}, {"key": "26419232", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9813146232155516, "res": {"Yes": 0.9813146232155516, "No": 0.018681398178992833}, "ground_truth": 1}, {"key": "26419232", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9895838601552763, "res": {"Yes": 0.9895838601552763, "No": 0.010413790933148842}, "ground_truth": 0}, {"key": "26419232", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8991238543308147, "res": {"Yes": 0.8991238543308147, "No": 0.10084158084702938}, "ground_truth": 0}, {"key": "34232398", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5746341508930957, "res": {"Yes": 0.5746341508930957, "No": 0.4253637473471026}, "ground_truth": 0}, {"key": "34232398", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9425204804270384, "res": {"Yes": 0.9425204804270384, "No": 0.057476793726922416}, "ground_truth": 0}, {"key": "34232398", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8158090245100172, "res": {"Yes": 0.8158090245100172, "No": 0.18419067145686668}, "ground_truth": 1}, {"key": "34232398", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9700682006576475, "res": {"Yes": 0.9700682006576475, "No": 0.02992957072060622}, "ground_truth": 0}, {"key": "34232398", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9904186623343352, "res": {"Yes": 0.9904186623343352, "No": 0.009580910976764284}, "ground_truth": 0}, {"key": "33586045", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0038617956862012554, "res": {"No": 0.9961379300496185, "Yes": 0.0038617956862012554}, "ground_truth": 0}, {"key": "33586045", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8876159928531531, "res": {"Yes": 0.8876159928531531, "No": 0.11238247163401839}, "ground_truth": 0}, {"key": "33586045", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8647252003329262, "res": {"Yes": 0.8647252003329262, "No": 0.13527338150563262}, "ground_truth": 1}, {"key": "33586045", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9955617194069087, "res": {"Yes": 0.9955617194069087, "No": 0.004437214785217732}, "ground_truth": 0}, {"key": "33586045", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.13561826702161217, "res": {"No": 0.8643771839007509, "Yes": 0.13561826702161217}, "ground_truth": 0}, {"key": "32281151", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.16675053263143352, "res": {"No": 0.833248659963668, "Yes": 0.16675053263143352}, "ground_truth": 0}, {"key": "32281151", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9986217867094659, "res": {"Yes": 0.9986217867094659, "No": 0.0013775799206493526}, "ground_truth": 0}, {"key": "32281151", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9754243518537921, "res": {"Yes": 0.9754243518537921, "No": 0.024574022252670358}, "ground_truth": 1}, {"key": "32281151", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.37624185913636576, "res": {"No": 0.6237491217084783, "Yes": 0.37624185913636576}, "ground_truth": 0}, {"key": "32281151", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.4080307662277566, "res": {"No": 0.5919671118196685, "Yes": 0.4080307662277566}, "ground_truth": 0}, {"key": "37308159", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.17479281862249244, "res": {"No": 0.8252035547918719, "Yes": 0.17479281862249244}, "ground_truth": 0}, {"key": "37308159", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.004654508310187694, "res": {"No": 0.9953416459452508, "Yes": 0.004654508310187694}, "ground_truth": 0}, {"key": "37308159", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.007938967896647607, "res": {"No": 0.9920592159310183, "Yes": 0.007938967896647607}, "ground_truth": 1}, {"key": "37308159", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.015242297278876833, "res": {"No": 0.9847561351407336, "Yes": 0.015242297278876833}, "ground_truth": 0}, {"key": "37308159", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0003509959756320121, "res": {"No": 0.9996480341545159, "Yes": 0.0003509959756320121}, "ground_truth": 0}, {"key": "35694408", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9975284734634505, "res": {"Yes": 0.9975284734634505, "No": 0.0024712578671861082}, "ground_truth": 0}, {"key": "35694408", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993169880589199, "res": {"Yes": 0.9993169880589199, "No": 0.0006816428620249733}, "ground_truth": 0}, {"key": "35694408", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994041343484907, "res": {"Yes": 0.9994041343484907, "No": 0.0005949566572678192}, "ground_truth": 1}, {"key": "35694408", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988329593222661, "res": {"Yes": 0.9988329593222661, "No": 0.0011662031244594917}, "ground_truth": 0}, {"key": "35694408", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998221005559831, "res": {"Yes": 0.9998221005559831, "No": 0.00017708087656593662}, "ground_truth": 0}, {"key": "39781995", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9919022558114896, "res": {"Yes": 0.9919022558114896, "No": 0.00809736158995783}, "ground_truth": 0}, {"key": "39781995", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997817058596339, "res": {"Yes": 0.9997817058596339, "No": 0.00021785932535615566}, "ground_truth": 0}, {"key": "39781995", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993334160258753, "res": {"Yes": 0.9993334160258753, "No": 0.0006658993666279831}, "ground_truth": 1}, {"key": "39781995", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9979162695867441, "res": {"Yes": 0.9979162695867441, "No": 0.002083629404164946}, "ground_truth": 0}, {"key": "39781995", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990268372303225, "res": {"Yes": 0.9990268372303225, "No": 0.0009730500872213838}, "ground_truth": 0}, {"key": "22799372", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9933201823335135, "res": {"Yes": 0.9933201823335135, "No": 0.0066793426631206534}, "ground_truth": 0}, {"key": "22799372", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9916761764688602, "res": {"Yes": 0.9916761764688602, "No": 0.008321678514212576}, "ground_truth": 0}, {"key": "22799372", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998859733865285, "res": {"Yes": 0.9998859733865285, "No": 0.00011338981335800547}, "ground_truth": 1}, {"key": "22799372", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999094541095266, "res": {"Yes": 0.9999094541095266, "No": 9.034652528948483e-05}, "ground_truth": 0}, {"key": "22799372", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9962593112726836, "res": {"Yes": 0.9962593112726836, "No": 0.0037401670603893654}, "ground_truth": 0}, {"key": "37428240", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.999314843826759, "res": {"Yes": 0.999314843826759, "No": 0.0006850381690592778}, "ground_truth": 0}, {"key": "37428240", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990818169882272, "res": {"Yes": 0.9990818169882272, "No": 0.0009178085869802201}, "ground_truth": 0}, {"key": "37428240", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998979738321226, "res": {"Yes": 0.998979738321226, "No": 0.0010198515515231514}, "ground_truth": 1}, {"key": "37428240", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997195153831671, "res": {"Yes": 0.9997195153831671, "No": 0.0002803359086720244}, "ground_truth": 0}, {"key": "37428240", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992381872268098, "res": {"Yes": 0.9992381872268098, "No": 0.0007615462896633866}, "ground_truth": 0}, {"key": "40612657", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9161200939220172, "res": {"Yes": 0.9161200939220172, "No": 0.0838756612471297}, "ground_truth": 0}, {"key": "40612657", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7420438281289088, "res": {"Yes": 0.7420438281289088, "No": 0.25795343367049}, "ground_truth": 0}, {"key": "40612657", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9635619445657141, "res": {"Yes": 0.9635619445657141, "No": 0.03643759163574281}, "ground_truth": 1}, {"key": "40612657", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5303814575987229, "res": {"Yes": 0.5303814575987229, "No": 0.46960880530244187}, "ground_truth": 0}, {"key": "40612657", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.4196581196569787, "res": {"No": 0.5803373190079073, "Yes": 0.4196581196569787}, "ground_truth": 0}, {"key": "34404662", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 8.533440752811897e-07, "res": {"No": 0.999999091165773, "Yes": 8.533440752811897e-07}, "ground_truth": 0}, {"key": "34404662", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5874814546589583, "res": {"Yes": 0.5874814546589583, "No": 0.4125178505842763}, "ground_truth": 0}, {"key": "34404662", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7749658307155861, "res": {"Yes": 0.7749658307155861, "No": 0.2250286165946309}, "ground_truth": 1}, {"key": "34404662", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.22833263221134134, "res": {"No": 0.771664692074442, "Yes": 0.22833263221134134}, "ground_truth": 0}, {"key": "34404662", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.374687812399694, "res": {"No": 0.6253095511608197, "Yes": 0.374687812399694}, "ground_truth": 0}, {"key": "32619704", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.01798788146079587, "res": {"No": 0.9820114733893983, "Yes": 0.01798788146079587}, "ground_truth": 0}, {"key": "32619704", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.964701530792605, "res": {"Yes": 0.964701530792605, "No": 0.035296834262975495}, "ground_truth": 0}, {"key": "32619704", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9584773571392886, "res": {"Yes": 0.9584773571392886, "No": 0.04152201958708549}, "ground_truth": 1}, {"key": "32619704", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5790162130428861, "res": {"Yes": 0.5790162130428861, "No": 0.4209802030666732}, "ground_truth": 0}, {"key": "32619704", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.4786146183461104, "res": {"No": 0.5213836165569042, "Yes": 0.4786146183461104}, "ground_truth": 0}, {"key": "39014883", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9839545205020463, "res": {"Yes": 0.9839545205020463, "No": 0.016044785069363545}, "ground_truth": 0}, {"key": "39014883", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9476444403526021, "res": {"Yes": 0.9476444403526021, "No": 0.05235403328655726}, "ground_truth": 0}, {"key": "39014883", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.979995785340232, "res": {"Yes": 0.979995785340232, "No": 0.020003450406161263}, "ground_truth": 1}, {"key": "39014883", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9900964929271281, "res": {"Yes": 0.9900964929271281, "No": 0.009902615151575894}, "ground_truth": 0}, {"key": "39014883", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9955411618669912, "res": {"Yes": 0.9955411618669912, "No": 0.00445802382369795}, "ground_truth": 0}, {"key": "37982812", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9788626230956622, "res": {"Yes": 0.9788626230956622, "No": 0.021136133816712626}, "ground_truth": 0}, {"key": "37982812", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.945306051405339, "res": {"Yes": 0.945306051405339, "No": 0.0546910993688363}, "ground_truth": 0}, {"key": "37982812", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.327949154297533, "res": {"No": 0.6720460594228425, "Yes": 0.327949154297533}, "ground_truth": 1}, {"key": "37982812", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9885248832023769, "res": {"Yes": 0.9885248832023769, "No": 0.011473732346857212}, "ground_truth": 0}, {"key": "37982812", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9864558506929012, "res": {"Yes": 0.9864558506929012, "No": 0.013542884482886135}, "ground_truth": 0}, {"key": "28123476", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8091524962471707, "res": {"Yes": 0.8091524962471707, "No": 0.19084702272331608}, "ground_truth": 0}, {"key": "28123476", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9986232152389536, "res": {"Yes": 0.9986232152389536, "No": 0.0013753973607179535}, "ground_truth": 0}, {"key": "28123476", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8662589644154723, "res": {"Yes": 0.8662589644154723, "No": 0.13374052992658203}, "ground_truth": 1}, {"key": "28123476", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9890093731528876, "res": {"Yes": 0.9890093731528876, "No": 0.010989834168378168}, "ground_truth": 0}, {"key": "28123476", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990690850304393, "res": {"Yes": 0.9990690850304393, "No": 0.0009308606217538575}, "ground_truth": 0}, {"key": "39078849", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9948242698873808, "res": {"Yes": 0.9948242698873808, "No": 0.005174916889291285}, "ground_truth": 0}, {"key": "39078849", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9774397439896136, "res": {"Yes": 0.9774397439896136, "No": 0.022558394966165282}, "ground_truth": 0}, {"key": "39078849", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.983169081530596, "res": {"Yes": 0.983169081530596, "No": 0.016830110586581}, "ground_truth": 1}, {"key": "39078849", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999121955450369, "res": {"Yes": 0.9999121955450369, "No": 8.68084144784913e-05}, "ground_truth": 0}, {"key": "39078849", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9965993514476454, "res": {"Yes": 0.9965993514476454, "No": 0.0033998080664417022}, "ground_truth": 0}, {"key": "39414137", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8899073569398936, "res": {"Yes": 0.8899073569398936, "No": 0.11008224618298154}, "ground_truth": 0}, {"key": "39414137", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9736598366745485, "res": {"Yes": 0.9736598366745485, "No": 0.026335661702755024}, "ground_truth": 0}, {"key": "39414137", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9915513362635536, "res": {"Yes": 0.9915513362635536, "No": 0.00844801902507144}, "ground_truth": 1}, {"key": "39414137", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9911847372900434, "res": {"Yes": 0.9911847372900434, "No": 0.008813887292245103}, "ground_truth": 0}, {"key": "39414137", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8858515528394426, "res": {"Yes": 0.8858515528394426, "No": 0.1141419533942449}, "ground_truth": 0}, {"key": "37371354", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.005377298330444046, "res": {"No": 0.9946219796113703, "Yes": 0.005377298330444046}, "ground_truth": 0}, {"key": "37371354", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7996274638178096, "res": {"Yes": 0.7996274638178096, "No": 0.20036703886916032}, "ground_truth": 0}, {"key": "37371354", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9972897490795575, "res": {"Yes": 0.9972897490795575, "No": 0.0027098554093427482}, "ground_truth": 1}, {"key": "37371354", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7167847590740233, "res": {"Yes": 0.7167847590740233, "No": 0.28321161629867264}, "ground_truth": 0}, {"key": "37371354", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.952155247862799, "res": {"Yes": 0.952155247862799, "No": 0.0478413811291502}, "ground_truth": 0}, {"key": "29497179", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 8.865795327520446e-07, "res": {"No": 0.9999988527586581, "Yes": 8.865795327520446e-07}, "ground_truth": 0}, {"key": "29497179", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9904624081118878, "res": {"Yes": 0.9904624081118878, "No": 0.009536917108431424}, "ground_truth": 0}, {"key": "29497179", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995809740159199, "res": {"Yes": 0.9995809740159199, "No": 0.00041843248801860713}, "ground_truth": 1}, {"key": "29497179", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.982778724905228, "res": {"Yes": 0.982778724905228, "No": 0.01722100361054447}, "ground_truth": 0}, {"key": "29497179", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7768786643082866, "res": {"Yes": 0.7768786643082866, "No": 0.22311927166229578}, "ground_truth": 0}, {"key": "35908694", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9998698901850163, "res": {"Yes": 0.9998698901850163, "No": 0.0001293516362014732}, "ground_truth": 0}, {"key": "35908694", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992258104694797, "res": {"Yes": 0.9992258104694797, "No": 0.0007737683643737098}, "ground_truth": 0}, {"key": "35908694", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996205191610745, "res": {"Yes": 0.9996205191610745, "No": 0.00037880234729918314}, "ground_truth": 1}, {"key": "35908694", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989477386156908, "res": {"Yes": 0.9989477386156908, "No": 0.0010515214117248284}, "ground_truth": 0}, {"key": "35908694", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9935530188370225, "res": {"Yes": 0.9935530188370225, "No": 0.006444163123337399}, "ground_truth": 0}, {"key": "37619358", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7439021437628324, "res": {"Yes": 0.7439021437628324, "No": 0.25609710244379386}, "ground_truth": 0}, {"key": "37619358", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9428191974137753, "res": {"Yes": 0.9428191974137753, "No": 0.057179387724868296}, "ground_truth": 0}, {"key": "37619358", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5253390317770054, "res": {"Yes": 0.5253390317770054, "No": 0.4746585858574306}, "ground_truth": 1}, {"key": "37619358", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5905019565332985, "res": {"Yes": 0.5905019565332985, "No": 0.409495551088818}, "ground_truth": 0}, {"key": "37619358", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5857823938045277, "res": {"Yes": 0.5857823938045277, "No": 0.41421573576545373}, "ground_truth": 0}, {"key": "37293103", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9995893111557601, "res": {"Yes": 0.9995893111557601, "No": 0.00041034745743354507}, "ground_truth": 0}, {"key": "37293103", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991530910899628, "res": {"Yes": 0.9991530910899628, "No": 0.0008463140921025406}, "ground_truth": 0}, {"key": "37293103", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998458950338354, "res": {"Yes": 0.998458950338354, "No": 0.0015408413200650086}, "ground_truth": 1}, {"key": "37293103", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997949309895245, "res": {"Yes": 0.9997949309895245, "No": 0.00020494170195029549}, "ground_truth": 0}, {"key": "37293103", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988628120887936, "res": {"Yes": 0.9988628120887936, "No": 0.0011370209940048388}, "ground_truth": 0}, {"key": "36883729", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.00012638522170217552, "res": {"No": 0.9998715588292736, "Yes": 0.00012638522170217552}, "ground_truth": 0}, {"key": "36883729", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9979441659276355, "res": {"Yes": 0.9979441659276355, "No": 0.002051625239859953}, "ground_truth": 0}, {"key": "36883729", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9967194218941247, "res": {"Yes": 0.9967194218941247, "No": 0.003277225823443485}, "ground_truth": 1}, {"key": "36883729", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9648703181600897, "res": {"Yes": 0.9648703181600897, "No": 0.03512583076272826}, "ground_truth": 0}, {"key": "36883729", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.966765476336157, "res": {"Yes": 0.966765476336157, "No": 0.033224813089395205}, "ground_truth": 0}, {"key": "39209521", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9913527107487328, "res": {"Yes": 0.9913527107487328, "No": 0.008646259321090335}, "ground_truth": 0}, {"key": "39209521", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994191378657657, "res": {"Yes": 0.9994191378657657, "No": 0.0005800402849647776}, "ground_truth": 0}, {"key": "39209521", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996990219729768, "res": {"Yes": 0.9996990219729768, "No": 0.00030040980463751955}, "ground_truth": 1}, {"key": "39209521", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9852164399092289, "res": {"Yes": 0.9852164399092289, "No": 0.014777145717611545}, "ground_truth": 0}, {"key": "39209521", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.994438857024322, "res": {"Yes": 0.994438857024322, "No": 0.005558281506833193}, "ground_truth": 0}, {"key": "27792571", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9977371660774651, "res": {"Yes": 0.9977371660774651, "No": 0.0022618088719890757}, "ground_truth": 0}, {"key": "27792571", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.998332872203969, "res": {"Yes": 0.998332872203969, "No": 0.0016662428125983975}, "ground_truth": 0}, {"key": "27792571", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7969036725846173, "res": {"Yes": 0.7969036725846173, "No": 0.20309466065157158}, "ground_truth": 1}, {"key": "27792571", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9757859677069658, "res": {"Yes": 0.9757859677069658, "No": 0.024213360775704764}, "ground_truth": 0}, {"key": "27792571", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.3101931223961991, "res": {"No": 0.6898020407621065, "Yes": 0.3101931223961991}, "ground_truth": 0}, {"key": "39755647", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9957133373794058, "res": {"Yes": 0.9957133373794058, "No": 0.004286509986894215}, "ground_truth": 0}, {"key": "39755647", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995702575457518, "res": {"Yes": 0.9995702575457518, "No": 0.0004294044110425697}, "ground_truth": 0}, {"key": "39755647", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998412891059067, "res": {"Yes": 0.9998412891059067, "No": 0.0001582405839208988}, "ground_truth": 1}, {"key": "39755647", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997564405154282, "res": {"Yes": 0.9997564405154282, "No": 0.00024284552897170416}, "ground_truth": 0}, {"key": "39755647", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999467124528592, "res": {"Yes": 0.999467124528592, "No": 0.0005322171368075851}, "ground_truth": 0}, {"key": "40800537", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5118977914217355, "res": {"Yes": 0.5118977914217355, "No": 0.4881005252393407}, "ground_truth": 0}, {"key": "40800537", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994249717921264, "res": {"Yes": 0.9994249717921264, "No": 0.0005747839079861647}, "ground_truth": 0}, {"key": "40800537", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994823672680727, "res": {"Yes": 0.9994823672680727, "No": 0.0005175160597359964}, "ground_truth": 1}, {"key": "40800537", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996486299449218, "res": {"Yes": 0.9996486299449218, "No": 0.00035087567483230045}, "ground_truth": 0}, {"key": "40800537", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985698336639972, "res": {"Yes": 0.9985698336639972, "No": 0.0014291891835909562}, "ground_truth": 0}, {"key": "14171461", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0007232747457769576, "res": {"No": 0.9992741306307236, "Yes": 0.0007232747457769576}, "ground_truth": 0}, {"key": "14171461", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.20422952399210934, "res": {"No": 0.7957697848349156, "Yes": 0.20422952399210934}, "ground_truth": 0}, {"key": "14171461", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992803209932531, "res": {"Yes": 0.9992803209932531, "No": 0.000719188043260488}, "ground_truth": 1}, {"key": "14171461", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9426950249893242, "res": {"Yes": 0.9426950249893242, "No": 0.05730221498929092}, "ground_truth": 0}, {"key": "14171461", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.18808988851898167, "res": {"No": 0.8119050168379423, "Yes": 0.18808988851898167}, "ground_truth": 0}, {"key": "36892440", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4729423876108062, "res": {"No": 0.5270541944286591, "Yes": 0.4729423876108062}, "ground_truth": 0}, {"key": "36892440", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9543173050121861, "res": {"Yes": 0.9543173050121861, "No": 0.0456814943832618}, "ground_truth": 0}, {"key": "36892440", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8519576755255068, "res": {"Yes": 0.8519576755255068, "No": 0.14803730147215266}, "ground_truth": 1}, {"key": "36892440", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.26681114311886456, "res": {"No": 0.7331847958014068, "Yes": 0.26681114311886456}, "ground_truth": 0}, {"key": "36892440", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.07185184415860926, "res": {"No": 0.9281420284572992, "Yes": 0.07185184415860926}, "ground_truth": 0}, {"key": "33733410", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7103734793479339, "res": {"Yes": 0.7103734793479339, "No": 0.2896234349372256}, "ground_truth": 0}, {"key": "33733410", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9485072272248384, "res": {"Yes": 0.9485072272248384, "No": 0.05149196000024464}, "ground_truth": 0}, {"key": "33733410", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990507596139651, "res": {"Yes": 0.9990507596139651, "No": 0.0009488005025992405}, "ground_truth": 1}, {"key": "33733410", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4526743301661762, "res": {"No": 0.5473245090982632, "Yes": 0.4526743301661762}, "ground_truth": 0}, {"key": "33733410", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9310162476791946, "res": {"Yes": 0.9310162476791946, "No": 0.06898087408377601}, "ground_truth": 0}, {"key": "38587765", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9501337697853708, "res": {"Yes": 0.9501337697853708, "No": 0.049865320390052245}, "ground_truth": 0}, {"key": "38587765", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998946743031407, "res": {"Yes": 0.9998946743031407, "No": 0.00010515553690478061}, "ground_truth": 0}, {"key": "38587765", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995249953204606, "res": {"Yes": 0.9995249953204606, "No": 0.0004746843030731348}, "ground_truth": 1}, {"key": "38587765", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992910343949607, "res": {"Yes": 0.9992910343949607, "No": 0.0007087132897719386}, "ground_truth": 0}, {"key": "38587765", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994288995399836, "res": {"Yes": 0.9994288995399836, "No": 0.0005707265840657573}, "ground_truth": 0}, {"key": "41065582", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.07325044177830554, "res": {"No": 0.9267395620283948, "Yes": 0.07325044177830554}, "ground_truth": 0}, {"key": "41065582", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9804907474041511, "res": {"Yes": 0.9804907474041511, "No": 0.0195027168007815}, "ground_truth": 0}, {"key": "41065582", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.42337490171105013, "res": {"No": 0.5766201431681363, "Yes": 0.42337490171105013}, "ground_truth": 1}, {"key": "41065582", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9951016051583162, "res": {"Yes": 0.9951016051583162, "No": 0.004897531383993527}, "ground_truth": 0}, {"key": "41065582", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9709554376483656, "res": {"Yes": 0.9709554376483656, "No": 0.029041135167487887}, "ground_truth": 0}, {"key": "34713891", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 6.894277026227788e-07, "res": {"No": 0.99999861435166, "Yes": 6.894277026227788e-07}, "ground_truth": 0}, {"key": "34713891", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9859984434814172, "res": {"Yes": 0.9859984434814172, "No": 0.014001291550707748}, "ground_truth": 0}, {"key": "34713891", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9888933622349305, "res": {"Yes": 0.9888933622349305, "No": 0.01110573874733603}, "ground_truth": 1}, {"key": "34713891", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978883739258728, "res": {"Yes": 0.9978883739258728, "No": 0.0021095787415101085}, "ground_truth": 0}, {"key": "34713891", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9907125017253027, "res": {"Yes": 0.9907125017253027, "No": 0.009284923716401154}, "ground_truth": 0}, {"key": "18913023", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5653374497090141, "res": {"Yes": 0.5653374497090141, "No": 0.4346597229932614}, "ground_truth": 0}, {"key": "18913023", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9835186917456176, "res": {"Yes": 0.9835186917456176, "No": 0.01648062220591883}, "ground_truth": 0}, {"key": "18913023", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9739984321920341, "res": {"Yes": 0.9739984321920341, "No": 0.026000877279777082}, "ground_truth": 1}, {"key": "18913023", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9507451152242585, "res": {"Yes": 0.9507451152242585, "No": 0.04925178344196918}, "ground_truth": 0}, {"key": "18913023", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.60657945100126, "res": {"Yes": 0.60657945100126, "No": 0.3934190146724066}, "ground_truth": 0}, {"key": "36884100", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.992394289116153, "res": {"Yes": 0.992394289116153, "No": 0.007605433141959359}, "ground_truth": 0}, {"key": "36884100", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9916949342011387, "res": {"Yes": 0.9916949342011387, "No": 0.008304389903200055}, "ground_truth": 0}, {"key": "36884100", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9955209529847385, "res": {"Yes": 0.9955209529847385, "No": 0.004478558713739424}, "ground_truth": 1}, {"key": "36884100", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9744951616531524, "res": {"Yes": 0.9744951616531524, "No": 0.025503675498715395}, "ground_truth": 0}, {"key": "36884100", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8283779395549925, "res": {"Yes": 0.8283779395549925, "No": 0.17161973374948122}, "ground_truth": 0}, {"key": "39899913", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9912314707697235, "res": {"Yes": 0.9912314707697235, "No": 0.008768057419860165}, "ground_truth": 0}, {"key": "39899913", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996463658732931, "res": {"Yes": 0.9996463658732931, "No": 0.000353196711452924}, "ground_truth": 0}, {"key": "39899913", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9968108643308776, "res": {"Yes": 0.9968108643308776, "No": 0.0031891208365422883}, "ground_truth": 1}, {"key": "39899913", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9953378636541825, "res": {"Yes": 0.9953378636541825, "No": 0.004661385767741294}, "ground_truth": 0}, {"key": "39899913", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990036520845255, "res": {"Yes": 0.9990036520845255, "No": 0.000995950201623117}, "ground_truth": 0}, {"key": "30725366", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9914960251065645, "res": {"Yes": 0.9914960251065645, "No": 0.008503319179517249}, "ground_truth": 0}, {"key": "30725366", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9980690656570336, "res": {"Yes": 0.9980690656570336, "No": 0.001930913638990792}, "ground_truth": 0}, {"key": "30725366", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998899066707154, "res": {"Yes": 0.9998899066707154, "No": 0.00011000706136554405}, "ground_truth": 1}, {"key": "30725366", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994711753170884, "res": {"Yes": 0.9994711753170884, "No": 0.0005286461254250795}, "ground_truth": 0}, {"key": "30725366", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997557364771932, "res": {"Yes": 0.9997557364771932, "No": 0.00024381617445209776}, "ground_truth": 0}, {"key": "26133523", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.003540651603463614, "res": {"No": 0.996458362445547, "Yes": 0.003540651603463614}, "ground_truth": 0}, {"key": "26133523", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999773963544663, "res": {"Yes": 0.9999773963544663, "No": 2.2459002992497756e-05}, "ground_truth": 0}, {"key": "26133523", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996445784572067, "res": {"Yes": 0.9996445784572067, "No": 0.0003548233137971736}, "ground_truth": 1}, {"key": "26133523", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9984551455180815, "res": {"Yes": 0.9984551455180815, "No": 0.0015447194050202979}, "ground_truth": 0}, {"key": "26133523", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997305946361441, "res": {"Yes": 0.9997305946361441, "No": 0.0002691122443908325}, "ground_truth": 0}, {"key": "29332665", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9961342598857902, "res": {"Yes": 0.9961342598857902, "No": 0.0038654359847721475}, "ground_truth": 0}, {"key": "29332665", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9850166582737578, "res": {"Yes": 0.9850166582737578, "No": 0.014983071228169591}, "ground_truth": 0}, {"key": "29332665", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.932572101322645, "res": {"Yes": 0.932572101322645, "No": 0.06742760332656329}, "ground_truth": 1}, {"key": "29332665", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999937345628867, "res": {"Yes": 0.999937345628867, "No": 6.259463414910865e-05}, "ground_truth": 0}, {"key": "29332665", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992381872268098, "res": {"Yes": 0.9992381872268098, "No": 0.0007613081152364017}, "ground_truth": 0}, {"key": "37400481", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.00686175252331653, "res": {"No": 0.9931380206405095, "Yes": 0.00686175252331653}, "ground_truth": 0}, {"key": "37400481", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9949551313111149, "res": {"Yes": 0.9949551313111149, "No": 0.005044259070929017}, "ground_truth": 0}, {"key": "37400481", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9961902185026325, "res": {"Yes": 0.9961902185026325, "No": 0.0038089755900471314}, "ground_truth": 1}, {"key": "37400481", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9695561107569677, "res": {"Yes": 0.9695561107569677, "No": 0.030442738079032337}, "ground_truth": 0}, {"key": "37400481", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992968712109814, "res": {"Yes": 0.9992968712109814, "No": 0.0007026230583982924}, "ground_truth": 0}, {"key": "38787241", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9998022009648091, "res": {"Yes": 0.9998022009648091, "No": 0.0001973665299102955}, "ground_truth": 0}, {"key": "38787241", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999696483206215, "res": {"Yes": 0.9999696483206215, "No": 2.943936010216435e-05}, "ground_truth": 0}, {"key": "38787241", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999983237218497, "res": {"Yes": 0.999983237218497, "No": 1.6446678763707134e-05}, "ground_truth": 1}, {"key": "38787241", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999557020111849, "res": {"Yes": 0.9999557020111849, "No": 4.4175598122881555e-05}, "ground_truth": 0}, {"key": "38787241", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999804955832136, "res": {"Yes": 0.9999804955832136, "No": 1.9145095208992116e-05}, "ground_truth": 0}, {"key": "38225963", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.873183020185396, "res": {"Yes": 0.873183020185396, "No": 0.12681635026299273}, "ground_truth": 0}, {"key": "38225963", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9743997320658628, "res": {"Yes": 0.9743997320658628, "No": 0.025598544105314057}, "ground_truth": 0}, {"key": "38225963", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.996499077569562, "res": {"Yes": 0.996499077569562, "No": 0.003500586685869671}, "ground_truth": 1}, {"key": "38225963", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9761374036984964, "res": {"Yes": 0.9761374036984964, "No": 0.023861480852725176}, "ground_truth": 0}, {"key": "38225963", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9828789066119891, "res": {"Yes": 0.9828789066119891, "No": 0.017120573671168732}, "ground_truth": 0}, {"key": "26072034", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0414394480655965, "res": {"No": 0.9585511819082908, "Yes": 0.0414394480655965}, "ground_truth": 0}, {"key": "26072034", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9838762834849827, "res": {"Yes": 0.9838762834849827, "No": 0.016121612756157172}, "ground_truth": 0}, {"key": "26072034", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9806145264855588, "res": {"Yes": 0.9806145264855588, "No": 0.01937717406948241}, "ground_truth": 1}, {"key": "26072034", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.1631302365442058, "res": {"No": 0.8368639805517002, "Yes": 0.1631302365442058}, "ground_truth": 0}, {"key": "26072034", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7970488896323963, "res": {"Yes": 0.7970488896323963, "No": 0.20294578592850418}, "ground_truth": 0}, {"key": "35690810", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7798406851250643, "res": {"Yes": 0.7798406851250643, "No": 0.22015892655466968}, "ground_truth": 0}, {"key": "35690810", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999360320122465, "res": {"Yes": 0.999360320122465, "No": 0.0006391371464074557}, "ground_truth": 0}, {"key": "35690810", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9971388423357402, "res": {"Yes": 0.9971388423357402, "No": 0.002861057406295348}, "ground_truth": 1}, {"key": "35690810", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989618945047095, "res": {"Yes": 0.9989618945047095, "No": 0.0010378712900000562}, "ground_truth": 0}, {"key": "35690810", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997316671676959, "res": {"Yes": 0.9997316671676959, "No": 0.0002677405883878171}, "ground_truth": 0}, {"key": "36855665", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0007316535854053498, "res": {"No": 0.9992679512085556, "Yes": 0.0007316535854053498}, "ground_truth": 0}, {"key": "36855665", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.007590676204811479, "res": {"No": 0.9924089629650757, "Yes": 0.007590676204811479}, "ground_truth": 0}, {"key": "36855665", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.44870221478875555, "res": {"No": 0.5512945164592483, "Yes": 0.44870221478875555}, "ground_truth": 1}, {"key": "36855665", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.41835026617131016, "res": {"No": 0.5816377777537318, "Yes": 0.41835026617131016}, "ground_truth": 0}, {"key": "36855665", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.40384283459091175, "res": {"No": 0.5961560961001057, "Yes": 0.40384283459091175}, "ground_truth": 0}, {"key": "29757662", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9241127564458976, "res": {"Yes": 0.9241127564458976, "No": 0.07588416849998972}, "ground_truth": 0}, {"key": "29757662", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9949129988382674, "res": {"Yes": 0.9949129988382674, "No": 0.0050844810995914844}, "ground_truth": 0}, {"key": "29757662", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.995181638328546, "res": {"Yes": 0.995181638328546, "No": 0.004817558569958976}, "ground_truth": 1}, {"key": "29757662", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9875065384634206, "res": {"Yes": 0.9875065384634206, "No": 0.012489000276021747}, "ground_truth": 0}, {"key": "29757662", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.992227490884428, "res": {"Yes": 0.992227490884428, "No": 0.007757682005820856}, "ground_truth": 0}, {"key": "19134339", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.373461391212498, "res": {"No": 0.6265381203304251, "Yes": 0.373461391212498}, "ground_truth": 0}, {"key": "19134339", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994246143578434, "res": {"Yes": 0.9994246143578434, "No": 0.000575343099693236}, "ground_truth": 0}, {"key": "19134339", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9962478286532871, "res": {"Yes": 0.9962478286532871, "No": 0.003751927766584099}, "ground_truth": 1}, {"key": "19134339", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9851315238230884, "res": {"Yes": 0.9851315238230884, "No": 0.014868431572966252}, "ground_truth": 0}, {"key": "19134339", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9727784641684676, "res": {"Yes": 0.9727784641684676, "No": 0.027221300650548435}, "ground_truth": 0}, {"key": "35360732", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9777391434630773, "res": {"Yes": 0.9777391434630773, "No": 0.02225940195161315}, "ground_truth": 0}, {"key": "35360732", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9879838564433493, "res": {"Yes": 0.9879838564433493, "No": 0.01201398008746227}, "ground_truth": 0}, {"key": "35360732", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9734788267706387, "res": {"Yes": 0.9734788267706387, "No": 0.026519164995527568}, "ground_truth": 1}, {"key": "35360732", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9624448106967654, "res": {"Yes": 0.9624448106967654, "No": 0.037553807792041614}, "ground_truth": 0}, {"key": "35360732", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9774252789658765, "res": {"Yes": 0.9774252789658765, "No": 0.022573128151363628}, "ground_truth": 0}, {"key": "37713629", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.012485833467120093, "res": {"No": 0.9875121169036126, "Yes": 0.012485833467120093}, "ground_truth": 0}, {"key": "37713629", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8021303364843545, "res": {"Yes": 0.8021303364843545, "No": 0.1978493888721106}, "ground_truth": 0}, {"key": "37713629", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9959409015013476, "res": {"Yes": 0.9959409015013476, "No": 0.0040564178410049355}, "ground_truth": 1}, {"key": "37713629", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9961476231165203, "res": {"Yes": 0.9961476231165203, "No": 0.0038510493861158707}, "ground_truth": 0}, {"key": "37713629", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.006041449574812024, "res": {"No": 0.9939495143577456, "Yes": 0.006041449574812024}, "ground_truth": 0}, {"key": "33393394", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.00037645098692826596, "res": {"No": 0.9996231406593272, "Yes": 0.00037645098692826596}, "ground_truth": 0}, {"key": "33393394", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8818760197788444, "res": {"Yes": 0.8818760197788444, "No": 0.11812328639292673}, "ground_truth": 0}, {"key": "33393394", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9959381815904597, "res": {"Yes": 0.9959381815904597, "No": 0.004061532148821905}, "ground_truth": 1}, {"key": "33393394", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8615436128305898, "res": {"Yes": 0.8615436128305898, "No": 0.13845526526572396}, "ground_truth": 0}, {"key": "33393394", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9980620609334907, "res": {"Yes": 0.9980620609334907, "No": 0.001937850325345381}, "ground_truth": 0}, {"key": "32275837", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9153078291356951, "res": {"Yes": 0.9153078291356951, "No": 0.0846911812684766}, "ground_truth": 0}, {"key": "32275837", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996925906099522, "res": {"Yes": 0.9996925906099522, "No": 0.00030681855842423544}, "ground_truth": 0}, {"key": "32275837", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9984672709308401, "res": {"Yes": 0.9984672709308401, "No": 0.0015313259268789335}, "ground_truth": 1}, {"key": "32275837", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9972015361207057, "res": {"Yes": 0.9972015361207057, "No": 0.0027970471711379584}, "ground_truth": 0}, {"key": "32275837", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9853458191447234, "res": {"Yes": 0.9853458191447234, "No": 0.014647919020366064}, "ground_truth": 0}, {"key": "21458094", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9981499397750988, "res": {"Yes": 0.9981499397750988, "No": 0.0018482574549814326}, "ground_truth": 0}, {"key": "21458094", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9758371529265389, "res": {"Yes": 0.9758371529265389, "No": 0.024157243644163974}, "ground_truth": 0}, {"key": "21458094", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9949940733235776, "res": {"Yes": 0.9949940733235776, "No": 0.005003463031445408}, "ground_truth": 1}, {"key": "21458094", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9817481793698929, "res": {"Yes": 0.9817481793698929, "No": 0.018245850402733136}, "ground_truth": 0}, {"key": "21458094", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9963837920857171, "res": {"Yes": 0.9963837920857171, "No": 0.0036118964939428322}, "ground_truth": 0}, {"key": "40975362", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9979062992555192, "res": {"Yes": 0.9979062992555192, "No": 0.002093407830468389}, "ground_truth": 0}, {"key": "40975362", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9855068407629586, "res": {"Yes": 0.9855068407629586, "No": 0.01449261600930928}, "ground_truth": 0}, {"key": "40975362", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9625538079684349, "res": {"Yes": 0.9625538079684349, "No": 0.037444759951389246}, "ground_truth": 1}, {"key": "40975362", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9704742203424686, "res": {"Yes": 0.9704742203424686, "No": 0.02952504183396408}, "ground_truth": 0}, {"key": "40975362", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7023246622714084, "res": {"Yes": 0.7023246622714084, "No": 0.2976746700705779}, "ground_truth": 0}, {"key": "35234201", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.20146794341568042, "res": {"No": 0.7985251382353558, "Yes": 0.20146794341568042}, "ground_truth": 0}, {"key": "35234201", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.001049058378021149, "res": {"No": 0.9989488067910788, "Yes": 0.001049058378021149}, "ground_truth": 0}, {"key": "35234201", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8855584819089176, "res": {"Yes": 0.8855584819089176, "No": 0.11443329524839298}, "ground_truth": 1}, {"key": "35234201", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.368916480746731, "res": {"No": 0.6310673542887376, "Yes": 0.368916480746731}, "ground_truth": 0}, {"key": "35234201", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9005792874420518, "res": {"Yes": 0.9005792874420518, "No": 0.09941460942628229}, "ground_truth": 0}, {"key": "36037573", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5779571430679749, "res": {"Yes": 0.5779571430679749, "No": 0.422031906493394}, "ground_truth": 0}, {"key": "36037573", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9980951962456861, "res": {"Yes": 0.9980951962456861, "No": 0.001898628491586151}, "ground_truth": 0}, {"key": "36037573", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9793071638558044, "res": {"Yes": 0.9793071638558044, "No": 0.02068396120612216}, "ground_truth": 1}, {"key": "36037573", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8773885063546527, "res": {"Yes": 0.8773885063546527, "No": 0.12259408536452673}, "ground_truth": 0}, {"key": "36037573", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9826434606197894, "res": {"Yes": 0.9826434606197894, "No": 0.017345008647532714}, "ground_truth": 0}, {"key": "30861915", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9977098703574554, "res": {"Yes": 0.9977098703574554, "No": 0.002289831602834534}, "ground_truth": 0}, {"key": "30861915", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989770030185493, "res": {"Yes": 0.9989770030185493, "No": 0.0010228959580199787}, "ground_truth": 0}, {"key": "30861915", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999847868417213, "res": {"Yes": 0.9999847868417213, "No": 1.5001040389009605e-05}, "ground_truth": 1}, {"key": "30861915", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999011106398752, "res": {"Yes": 0.9999011106398752, "No": 9.879673503114135e-05}, "ground_truth": 0}, {"key": "30861915", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9981637236222345, "res": {"Yes": 0.9981637236222345, "No": 0.0018360275159413151}, "ground_truth": 0}, {"key": "40173012", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9638357371867584, "res": {"Yes": 0.9638357371867584, "No": 0.03616057652004296}, "ground_truth": 0}, {"key": "40173012", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9904921135154147, "res": {"Yes": 0.9904921135154147, "No": 0.009503972593942518}, "ground_truth": 0}, {"key": "40173012", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9954962646698935, "res": {"Yes": 0.9954962646698935, "No": 0.004503185246705432}, "ground_truth": 1}, {"key": "40173012", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978570334385091, "res": {"Yes": 0.9978570334385091, "No": 0.0021423485466557073}, "ground_truth": 0}, {"key": "40173012", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9639516993842906, "res": {"Yes": 0.9639516993842906, "No": 0.036045793760211796}, "ground_truth": 0}, {"key": "35100330", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8198726874377952, "res": {"Yes": 0.8198726874377952, "No": 0.18012547276794438}, "ground_truth": 0}, {"key": "35100330", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999786707670044, "res": {"Yes": 0.999786707670044, "No": 0.00021318739293415395}, "ground_truth": 0}, {"key": "35100330", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999830324176571, "res": {"Yes": 0.999830324176571, "No": 0.00016946383783694567}, "ground_truth": 1}, {"key": "35100330", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9804828368367123, "res": {"Yes": 0.9804828368367123, "No": 0.019516699407981383}, "ground_truth": 0}, {"key": "35100330", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999368688428554, "res": {"Yes": 0.9999368688428554, "No": 6.250493777141229e-05}, "ground_truth": 0}, {"key": "37220221", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.31146886425124587, "res": {"No": 0.688529462105394, "Yes": 0.31146886425124587}, "ground_truth": 0}, {"key": "37220221", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9421206849063892, "res": {"Yes": 0.9421206849063892, "No": 0.05787785137330902}, "ground_truth": 0}, {"key": "37220221", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4987329234804044, "res": {"No": 0.501263960188028, "Yes": 0.4987329234804044}, "ground_truth": 1}, {"key": "37220221", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8943924214064252, "res": {"Yes": 0.8943924214064252, "No": 0.10560527038568879}, "ground_truth": 0}, {"key": "37220221", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9940947501360121, "res": {"Yes": 0.9940947501360121, "No": 0.005903531782269157}, "ground_truth": 0}, {"key": "38815218", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3690146108227095, "res": {"No": 0.6309824498882897, "Yes": 0.3690146108227095}, "ground_truth": 0}, {"key": "38815218", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6290712208470044, "res": {"Yes": 0.6290712208470044, "No": 0.3709209543969753}, "ground_truth": 0}, {"key": "38815218", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.16156240536954147, "res": {"No": 0.8384277225025628, "Yes": 0.16156240536954147}, "ground_truth": 1}, {"key": "38815218", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.24115955755884827, "res": {"No": 0.7588338970521663, "Yes": 0.24115955755884827}, "ground_truth": 0}, {"key": "38815218", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.2195339694777475, "res": {"No": 0.7804560817409737, "Yes": 0.2195339694777475}, "ground_truth": 0}, {"key": "39379109", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9948371340431877, "res": {"Yes": 0.9948371340431877, "No": 0.005162757205744895}, "ground_truth": 0}, {"key": "39379109", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9695451296266434, "res": {"Yes": 0.9695451296266434, "No": 0.030454351153808255}, "ground_truth": 0}, {"key": "39379109", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9939758981038183, "res": {"Yes": 0.9939758981038183, "No": 0.006023658379517895}, "ground_truth": 1}, {"key": "39379109", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978717537344701, "res": {"Yes": 0.9978717537344701, "No": 0.0021277770132497017}, "ground_truth": 0}, {"key": "39379109", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9945035918303118, "res": {"Yes": 0.9945035918303118, "No": 0.005494154335819687}, "ground_truth": 0}, {"key": "14576125", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9998919329096687, "res": {"Yes": 0.9998919329096687, "No": 0.00010750684908580641}, "ground_truth": 0}, {"key": "14576125", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997216604436437, "res": {"Yes": 0.9997216604436437, "No": 0.0002780181941034143}, "ground_truth": 0}, {"key": "14576125", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997578706180514, "res": {"Yes": 0.9997578706180514, "No": 0.000241653663362792}, "ground_truth": 1}, {"key": "14576125", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994924906764456, "res": {"Yes": 0.9994924906764456, "No": 0.0005070237557236824}, "ground_truth": 0}, {"key": "14576125", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994040152095309, "res": {"Yes": 0.9994040152095309, "No": 0.0005954403155312532}, "ground_truth": 0}, {"key": "40814250", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9991777236046737, "res": {"Yes": 0.9991777236046737, "No": 0.0008222135528458066}, "ground_truth": 0}, {"key": "40814250", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999466429775365, "res": {"Yes": 0.9999466429775365, "No": 5.3155286199181564e-05}, "ground_truth": 0}, {"key": "40814250", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999757275415809, "res": {"Yes": 0.9999757275415809, "No": 2.4164377823713275e-05}, "ground_truth": 1}, {"key": "40814250", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999782307609533, "res": {"Yes": 0.9999782307609533, "No": 2.1618416301191472e-05}, "ground_truth": 0}, {"key": "40814250", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998478406274117, "res": {"Yes": 0.9998478406274117, "No": 0.0001520545834400898}, "ground_truth": 0}, {"key": "36334488", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9979322920594118, "res": {"Yes": 0.9979322920594118, "No": 0.002067005163956391}, "ground_truth": 0}, {"key": "36334488", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9789144934214636, "res": {"Yes": 0.9789144934214636, "No": 0.02108410162489671}, "ground_truth": 0}, {"key": "36334488", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9937541663191191, "res": {"Yes": 0.9937541663191191, "No": 0.006244253363738221}, "ground_truth": 1}, {"key": "36334488", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998288939803051, "res": {"Yes": 0.9998288939803051, "No": 0.0001704732781357703}, "ground_truth": 0}, {"key": "36334488", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9941833372696545, "res": {"Yes": 0.9941833372696545, "No": 0.005814142310121107}, "ground_truth": 0}, {"key": "36888322", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.633485061752596, "res": {"Yes": 0.633485061752596, "No": 0.3665141683045704}, "ground_truth": 0}, {"key": "36888322", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5018717851401293, "res": {"Yes": 0.5018717851401293, "No": 0.4981276547332073}, "ground_truth": 0}, {"key": "36888322", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.02763412104679233, "res": {"No": 0.97236520284148, "Yes": 0.02763412104679233}, "ground_truth": 1}, {"key": "36888322", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.075678339162995, "res": {"No": 0.924320782852399, "Yes": 0.075678339162995}, "ground_truth": 0}, {"key": "36888322", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.19900858788257178, "res": {"No": 0.8009910544128886, "Yes": 0.19900858788257178}, "ground_truth": 0}, {"key": "37318916", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.0002627180904792188, "res": {"No": 0.9997352423245008, "Yes": 0.0002627180904792188}, "ground_truth": 0}, {"key": "37318916", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 8.103867889862081e-05, "res": {"No": 0.9999141026393895, "Yes": 8.103867889862081e-05}, "ground_truth": 1}, {"key": "37318916", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 6.388015462846994e-07, "res": {"No": 0.9999981375378344, "Yes": 6.388015462846994e-07}, "ground_truth": 0}, {"key": "37318916", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.005629948411592285, "res": {"No": 0.994360827463141, "Yes": 0.005629948411592285}, "ground_truth": 0}, {"key": "39308700", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 3.538583355432419e-05, "res": {"No": 0.9999638075349631, "Yes": 3.538583355432419e-05}, "ground_truth": 0}, {"key": "39308700", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.06287675741616071, "res": {"No": 0.9371224483610182, "Yes": 0.06287675741616071}, "ground_truth": 0}, {"key": "39308700", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9061569263917562, "res": {"Yes": 0.9061569263917562, "No": 0.09384084218370745}, "ground_truth": 1}, {"key": "39308700", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.07798108357297927, "res": {"No": 0.9220126457090713, "Yes": 0.07798108357297927}, "ground_truth": 0}, {"key": "39308700", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.13139631729482373, "res": {"No": 0.8685996168444821, "Yes": 0.13139631729482373}, "ground_truth": 0}, {"key": "31061543", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.03038830647489268, "res": {"No": 0.9696111326883183, "Yes": 0.03038830647489268}, "ground_truth": 0}, {"key": "31061543", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990354080182265, "res": {"Yes": 0.9990354080182265, "No": 0.0009639848299923567}, "ground_truth": 0}, {"key": "31061543", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9826256189244511, "res": {"Yes": 0.9826256189244511, "No": 0.0173741640659656}, "ground_truth": 1}, {"key": "31061543", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998323502947827, "res": {"Yes": 0.9998323502947827, "No": 0.00016759972679819307}, "ground_truth": 0}, {"key": "31061543", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9966164073948934, "res": {"Yes": 0.9966164073948934, "No": 0.003383461436074731}, "ground_truth": 0}, {"key": "37380894", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9928010256540089, "res": {"Yes": 0.9928010256540089, "No": 0.007198767126878864}, "ground_truth": 0}, {"key": "37380894", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9985956350446861, "res": {"Yes": 0.9985956350446861, "No": 0.0014042470883632889}, "ground_truth": 0}, {"key": "37380894", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999932458601023, "res": {"Yes": 0.999932458601023, "No": 6.735812661176589e-05}, "ground_truth": 1}, {"key": "37380894", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9982115842247619, "res": {"Yes": 0.9982115842247619, "No": 0.0017878705574744275}, "ground_truth": 0}, {"key": "37380894", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9977294538982989, "res": {"Yes": 0.9977294538982989, "No": 0.0022705140940050867}, "ground_truth": 0}, {"key": "38410139", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.16803015863590176, "res": {"No": 0.8319687491368161, "Yes": 0.16803015863590176}, "ground_truth": 0}, {"key": "38410139", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994904652569402, "res": {"Yes": 0.9994904652569402, "No": 0.000508844036479}, "ground_truth": 0}, {"key": "38410139", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9947162159541605, "res": {"Yes": 0.9947162159541605, "No": 0.0052827525543013044}, "ground_truth": 1}, {"key": "38410139", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9985750675816399, "res": {"Yes": 0.9985750675816399, "No": 0.0014242655523305809}, "ground_truth": 0}, {"key": "38410139", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9760717509046518, "res": {"Yes": 0.9760717509046518, "No": 0.023927592214231463}, "ground_truth": 0}, {"key": "35953842", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0004740165600808717, "res": {"No": 0.9995251144438566, "Yes": 0.0004740165600808717}, "ground_truth": 0}, {"key": "35953842", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9776361303829959, "res": {"Yes": 0.9776361303829959, "No": 0.02236284282304674}, "ground_truth": 0}, {"key": "35953842", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998812057965902, "res": {"Yes": 0.9998812057965902, "No": 0.00011863215342585711}, "ground_truth": 1}, {"key": "35953842", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9964569480735511, "res": {"Yes": 0.9964569480735511, "No": 0.003542740495733114}, "ground_truth": 0}, {"key": "35953842", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8347285890692967, "res": {"Yes": 0.8347285890692967, "No": 0.16527002955513792}, "ground_truth": 0}, {"key": "39815663", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9394377039412803, "res": {"Yes": 0.9394377039412803, "No": 0.060561917956664824}, "ground_truth": 0}, {"key": "39815663", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9937511084428786, "res": {"Yes": 0.9937511084428786, "No": 0.0062477367550925755}, "ground_truth": 0}, {"key": "39815663", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5754012588987195, "res": {"Yes": 0.5754012588987195, "No": 0.4245932402999402}, "ground_truth": 1}, {"key": "39815663", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997215412768289, "res": {"Yes": 0.9997215412768289, "No": 0.00027824626251784986}, "ground_truth": 0}, {"key": "39815663", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9883860526552236, "res": {"Yes": 0.9883860526552236, "No": 0.01161363430450042}, "ground_truth": 0}, {"key": "35121432", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8406719133891104, "res": {"Yes": 0.8406719133891104, "No": 0.15932159650093525}, "ground_truth": 0}, {"key": "35121432", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9463219217362338, "res": {"Yes": 0.9463219217362338, "No": 0.0536759626814211}, "ground_truth": 0}, {"key": "35121432", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9974213675990116, "res": {"Yes": 0.9974213675990116, "No": 0.0025751270661660817}, "ground_truth": 1}, {"key": "35121432", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.983159983326013, "res": {"Yes": 0.983159983326013, "No": 0.016836308574278487}, "ground_truth": 0}, {"key": "35121432", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9324993206405827, "res": {"Yes": 0.9324993206405827, "No": 0.06748769459628448}, "ground_truth": 0}, {"key": "21712310", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9819684838321217, "res": {"Yes": 0.9819684838321217, "No": 0.01803106275137732}, "ground_truth": 0}, {"key": "21712310", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9434133946127949, "res": {"Yes": 0.9434133946127949, "No": 0.056582942978227205}, "ground_truth": 0}, {"key": "21712310", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9973369292808792, "res": {"Yes": 0.9973369292808792, "No": 0.0026628050013761135}, "ground_truth": 1}, {"key": "21712310", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993628218842474, "res": {"Yes": 0.9993628218842474, "No": 0.0006370161815292987}, "ground_truth": 0}, {"key": "21712310", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.998576135258673, "res": {"Yes": 0.998576135258673, "No": 0.0014238322142587384}, "ground_truth": 0}, {"key": "37952914", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7648591345149638, "res": {"Yes": 0.7648591345149638, "No": 0.23513967022638457}, "ground_truth": 0}, {"key": "37952914", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9934260551463727, "res": {"Yes": 0.9934260551463727, "No": 0.0065727300504661796}, "ground_truth": 0}, {"key": "37952914", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9963615434825955, "res": {"Yes": 0.9963615434825955, "No": 0.003638088036613208}, "ground_truth": 1}, {"key": "37952914", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9950974747986556, "res": {"Yes": 0.9950974747986556, "No": 0.00490061290026933}, "ground_truth": 0}, {"key": "37952914", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.995358536339552, "res": {"Yes": 0.995358536339552, "No": 0.004640846472333357}, "ground_truth": 0}, {"key": "38956779", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9961912838290218, "res": {"Yes": 0.9961912838290218, "No": 0.0038084119033736496}, "ground_truth": 0}, {"key": "38956779", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9930598397217505, "res": {"Yes": 0.9930598397217505, "No": 0.0069392054464634464}, "ground_truth": 1}, {"key": "38956779", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9964417988544367, "res": {"Yes": 0.9964417988544367, "No": 0.00355785657898025}, "ground_truth": 0}, {"key": "38956779", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9991505899531264, "res": {"Yes": 0.9991505899531264, "No": 0.0008488859628927144}, "ground_truth": 0}, {"key": "36101833", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.978162468043803, "res": {"Yes": 0.978162468043803, "No": 0.021837069882396757}, "ground_truth": 0}, {"key": "36101833", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9974590787192202, "res": {"Yes": 0.9974590787192202, "No": 0.002539578897708074}, "ground_truth": 0}, {"key": "36101833", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9944164552541848, "res": {"Yes": 0.9944164552541848, "No": 0.005583147463794247}, "ground_truth": 1}, {"key": "36101833", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9825258354117158, "res": {"Yes": 0.9825258354117158, "No": 0.01747075393125569}, "ground_truth": 0}, {"key": "36101833", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9629651912453197, "res": {"Yes": 0.9629651912453197, "No": 0.03703125474787433}, "ground_truth": 0}, {"key": "35544662", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.15015143912749926, "res": {"No": 0.849845220167053, "Yes": 0.15015143912749926}, "ground_truth": 0}, {"key": "35544662", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9301761241115512, "res": {"Yes": 0.9301761241115512, "No": 0.06980766929242581}, "ground_truth": 0}, {"key": "35544662", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7283147538747861, "res": {"Yes": 0.7283147538747861, "No": 0.271646225716938}, "ground_truth": 1}, {"key": "35544662", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9709349808037532, "res": {"Yes": 0.9709349808037532, "No": 0.029056815804074352}, "ground_truth": 0}, {"key": "35544662", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.913027836321825, "res": {"Yes": 0.913027836321825, "No": 0.08696827343481735}, "ground_truth": 0}, {"key": "39759044", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9993219875543854, "res": {"Yes": 0.9993219875543854, "No": 0.0006776485955733544}, "ground_truth": 0}, {"key": "39759044", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9959112233030607, "res": {"Yes": 0.9959112233030607, "No": 0.004087940422252181}, "ground_truth": 0}, {"key": "39759044", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9921625914068097, "res": {"Yes": 0.9921625914068097, "No": 0.007836706673722217}, "ground_truth": 1}, {"key": "39759044", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9913600968496192, "res": {"Yes": 0.9913600968496192, "No": 0.008639138601818799}, "ground_truth": 0}, {"key": "39759044", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9970375088627943, "res": {"Yes": 0.9970375088627943, "No": 0.0029619764911036966}, "ground_truth": 0}, {"key": "39433018", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.09341904935433866, "res": {"No": 0.9065791089812891, "Yes": 0.09341904935433866}, "ground_truth": 0}, {"key": "39433018", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9965861046374452, "res": {"Yes": 0.9965861046374452, "No": 0.00341246969191708}, "ground_truth": 0}, {"key": "39433018", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9790225646941821, "res": {"Yes": 0.9790225646941821, "No": 0.020977077186387173}, "ground_truth": 1}, {"key": "39433018", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996225448341318, "res": {"Yes": 0.9996225448341318, "No": 0.00037599853908280476}, "ground_truth": 0}, {"key": "39433018", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9986585265809607, "res": {"Yes": 0.9986585265809607, "No": 0.0013401438768494173}, "ground_truth": 0}, {"key": "22111959", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999444974303247, "res": {"Yes": 0.9999444974303247, "No": 5.487391274874166e-05}, "ground_truth": 0}, {"key": "22111959", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999907469518097, "res": {"Yes": 0.9999907469518097, "No": 8.753718293770816e-06}, "ground_truth": 0}, {"key": "22111959", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998324694848043, "res": {"Yes": 0.9998324694848043, "No": 0.00016741697520537718}, "ground_truth": 1}, {"key": "22111959", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999790998093942, "res": {"Yes": 0.999790998093942, "No": 0.00020886342259866529}, "ground_truth": 0}, {"key": "22111959", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.998587190855839, "res": {"Yes": 0.998587190855839, "No": 0.001412088450324686}, "ground_truth": 0}, {"key": "38210094", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.947988317609288, "res": {"Yes": 0.947988317609288, "No": 0.052008495434726826}, "ground_truth": 0}, {"key": "38210094", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9980032918791608, "res": {"Yes": 0.9980032918791608, "No": 0.0019939154710320386}, "ground_truth": 0}, {"key": "38210094", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9935471337418557, "res": {"Yes": 0.9935471337418557, "No": 0.006447569763673501}, "ground_truth": 1}, {"key": "38210094", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7961898154058944, "res": {"Yes": 0.7961898154058944, "No": 0.20380796021529268}, "ground_truth": 0}, {"key": "38210094", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984304299654706, "res": {"Yes": 0.9984304299654706, "No": 0.0015689949874158247}, "ground_truth": 0}, {"key": "37675935", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9973100227900179, "res": {"Yes": 0.9973100227900179, "No": 0.0026896631937279427}, "ground_truth": 0}, {"key": "37675935", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9003093342396836, "res": {"Yes": 0.9003093342396836, "No": 0.09969009051332979}, "ground_truth": 0}, {"key": "37675935", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9940662416967361, "res": {"Yes": 0.9940662416967361, "No": 0.005933638969294736}, "ground_truth": 1}, {"key": "37675935", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9842098770381258, "res": {"Yes": 0.9842098770381258, "No": 0.015789643950797665}, "ground_truth": 0}, {"key": "37675935", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9853126046823222, "res": {"Yes": 0.9853126046823222, "No": 0.014686927008881695}, "ground_truth": 0}, {"key": "35732604", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9925880460202456, "res": {"Yes": 0.9925880460202456, "No": 0.0074102929947778085}, "ground_truth": 0}, {"key": "35732604", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9244093924896354, "res": {"Yes": 0.9244093924896354, "No": 0.07558432186813813}, "ground_truth": 0}, {"key": "35732604", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9974932423774633, "res": {"Yes": 0.9974932423774633, "No": 0.0025058005867402097}, "ground_truth": 1}, {"key": "35732604", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9819920474305746, "res": {"Yes": 0.9819920474305746, "No": 0.018005032082801367}, "ground_truth": 0}, {"key": "35732604", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.851481879318619, "res": {"Yes": 0.851481879318619, "No": 0.1485014138365287}, "ground_truth": 0}, {"key": "27453212", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9957961898514929, "res": {"Yes": 0.9957961898514929, "No": 0.00420337291914034}, "ground_truth": 0}, {"key": "27453212", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9928838694206258, "res": {"Yes": 0.9928838694206258, "No": 0.0071148409633153345}, "ground_truth": 0}, {"key": "27453212", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9970885774347901, "res": {"Yes": 0.9970885774347901, "No": 0.0029104924072502593}, "ground_truth": 1}, {"key": "27453212", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9949670513429733, "res": {"Yes": 0.9949670513429733, "No": 0.005031691847662462}, "ground_truth": 0}, {"key": "27453212", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9792721767737568, "res": {"Yes": 0.9792721767737568, "No": 0.020725005760737932}, "ground_truth": 0}, {"key": "39910047", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.012985621137624102, "res": {"No": 0.9870136577550177, "Yes": 0.012985621137624102}, "ground_truth": 0}, {"key": "39910047", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9495460050824227, "res": {"Yes": 0.9495460050824227, "No": 0.05045306907695647}, "ground_truth": 0}, {"key": "39910047", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.20720422041624068, "res": {"No": 0.7927934324453322, "Yes": 0.20720422041624068}, "ground_truth": 1}, {"key": "39910047", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3453930621129856, "res": {"No": 0.6546063083549928, "Yes": 0.3453930621129856}, "ground_truth": 0}, {"key": "39910047", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.19193789938033712, "res": {"No": 0.8080609743530691, "Yes": 0.19193789938033712}, "ground_truth": 0}, {"key": "40054265", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9998977732755078, "res": {"Yes": 0.9998977732755078, "No": 0.00010209600110654544}, "ground_truth": 0}, {"key": "40054265", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999839524287637, "res": {"Yes": 0.9999839524287637, "No": 1.58468312304058e-05}, "ground_truth": 0}, {"key": "40054265", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999964686909351, "res": {"Yes": 0.9999964686909351, "No": 3.342040531323541e-06}, "ground_truth": 1}, {"key": "40054265", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999101692710216, "res": {"Yes": 0.9999101692710216, "No": 8.956150159648004e-05}, "ground_truth": 0}, {"key": "40054265", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997944542874151, "res": {"Yes": 0.9997944542874151, "No": 0.0002044815104533521}, "ground_truth": 0}, {"key": "19984615", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.19410562680902904, "res": {"No": 0.8058908237941238, "Yes": 0.19410562680902904}, "ground_truth": 0}, {"key": "19984615", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.003204410938633212, "res": {"No": 0.996768576922492, "Yes": 0.003204410938633212}, "ground_truth": 0}, {"key": "19984615", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 7.445132513500331e-05, "res": {"No": 0.9999183936139823, "Yes": 7.445132513500331e-05}, "ground_truth": 1}, {"key": "19984615", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.019999446116232743, "res": {"No": 0.9799902954192198, "Yes": 0.019999446116232743}, "ground_truth": 0}, {"key": "19984615", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.008372489561976554, "res": {"No": 0.9915958767583769, "Yes": 0.008372489561976554}, "ground_truth": 0}, {"key": "16490806", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9301803564225444, "res": {"Yes": 0.9301803564225444, "No": 0.06981943985769927}, "ground_truth": 0}, {"key": "16490806", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998596400713766, "res": {"Yes": 0.9998596400713766, "No": 0.00013997566106559728}, "ground_truth": 0}, {"key": "16490806", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999809723900273, "res": {"Yes": 0.9999809723900273, "No": 1.883375159768426e-05}, "ground_truth": 1}, {"key": "16490806", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978083646475392, "res": {"Yes": 0.9978083646475392, "No": 0.0021911312850792118}, "ground_truth": 0}, {"key": "16490806", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996687611716981, "res": {"Yes": 0.9996687611716981, "No": 0.00033043849923413657}, "ground_truth": 0}, {"key": "36396237", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9708492384089332, "res": {"Yes": 0.9708492384089332, "No": 0.029149940714371568}, "ground_truth": 0}, {"key": "36396237", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8105980584434204, "res": {"Yes": 0.8105980584434204, "No": 0.18940077620638265}, "ground_truth": 0}, {"key": "36396237", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997881377959671, "res": {"Yes": 0.9997881377959671, "No": 0.0002116943645836336}, "ground_truth": 1}, {"key": "36396237", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992260487548871, "res": {"Yes": 0.9992260487548871, "No": 0.0007738244646137359}, "ground_truth": 0}, {"key": "36396237", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996857981117554, "res": {"Yes": 0.9996857981117554, "No": 0.00031407649094073993}, "ground_truth": 0}, {"key": "40726444", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.005124686123644976, "res": {"No": 0.9948702866477136, "Yes": 0.005124686123644976}, "ground_truth": 0}, {"key": "40726444", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9270853189029281, "res": {"Yes": 0.9270853189029281, "No": 0.07291360732342825}, "ground_truth": 0}, {"key": "40726444", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9919533976263682, "res": {"Yes": 0.9919533976263682, "No": 0.008045559135165838}, "ground_truth": 1}, {"key": "40726444", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9983348954274179, "res": {"Yes": 0.9983348954274179, "No": 0.0016643721728884975}, "ground_truth": 0}, {"key": "40726444", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.19919564430688386, "res": {"No": 0.8007994962818443, "Yes": 0.19919564430688386}, "ground_truth": 0}, {"key": "37314826", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999704827216435, "res": {"Yes": 0.9999704827216435, "No": 2.8914828429137628e-05}, "ground_truth": 0}, {"key": "37314826", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998916945254614, "res": {"Yes": 0.9998916945254614, "No": 0.0001076885815838043}, "ground_truth": 0}, {"key": "37314826", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997479901398207, "res": {"Yes": 0.9997479901398207, "No": 0.00025191394924939197}, "ground_truth": 1}, {"key": "37314826", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996853214516837, "res": {"Yes": 0.9996853214516837, "No": 0.00031364775534719236}, "ground_truth": 0}, {"key": "37314826", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990620622388586, "res": {"Yes": 0.9990620622388586, "No": 0.0009373498246415849}, "ground_truth": 0}, {"key": "38506971", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.16653589620093798, "res": {"No": 0.8334629074009148, "Yes": 0.16653589620093798}, "ground_truth": 0}, {"key": "38506971", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992312859721322, "res": {"Yes": 0.9992312859721322, "No": 0.0007686298836209831}, "ground_truth": 0}, {"key": "38506971", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9847217007902537, "res": {"Yes": 0.9847217007902537, "No": 0.015277158111635263}, "ground_truth": 1}, {"key": "38506971", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9924450090048724, "res": {"Yes": 0.9924450090048724, "No": 0.007554466509346825}, "ground_truth": 0}, {"key": "38506971", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988641217985714, "res": {"Yes": 0.9988641217985714, "No": 0.0011326763446656528}, "ground_truth": 0}, {"key": "40699312", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9992613997995121, "res": {"Yes": 0.9992613997995121, "No": 0.0007382766050458186}, "ground_truth": 0}, {"key": "40699312", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9966463657357189, "res": {"Yes": 0.9966463657357189, "No": 0.0033535962549618705}, "ground_truth": 0}, {"key": "40699312", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999218502438513, "res": {"Yes": 0.9999218502438513, "No": 7.791305753054547e-05}, "ground_truth": 1}, {"key": "40699312", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9983925266714769, "res": {"Yes": 0.9983925266714769, "No": 0.0016071706599696267}, "ground_truth": 0}, {"key": "40699312", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.986583458983116, "res": {"Yes": 0.986583458983116, "No": 0.013415869254488948}, "ground_truth": 0}, {"key": "34695474", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5934238380246185, "res": {"Yes": 0.5934238380246185, "No": 0.406573847429661}, "ground_truth": 0}, {"key": "34695474", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9811431554300365, "res": {"Yes": 0.9811431554300365, "No": 0.018854814246580098}, "ground_truth": 0}, {"key": "34695474", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.994882091351134, "res": {"Yes": 0.994882091351134, "No": 0.005117204423930793}, "ground_truth": 1}, {"key": "34695474", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9806827443272047, "res": {"Yes": 0.9806827443272047, "No": 0.019315863068798133}, "ground_truth": 0}, {"key": "34695474", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.15543915657131757, "res": {"No": 0.8445541449397729, "Yes": 0.15543915657131757}, "ground_truth": 0}, {"key": "36281498", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9954838630537761, "res": {"Yes": 0.9954838630537761, "No": 0.004515429361305161}, "ground_truth": 0}, {"key": "36281498", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998865693437434, "res": {"Yes": 0.9998865693437434, "No": 0.0001131596391934128}, "ground_truth": 0}, {"key": "36281498", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999132682854126, "res": {"Yes": 0.9999132682854126, "No": 8.644103956183499e-05}, "ground_truth": 1}, {"key": "36281498", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998079216094166, "res": {"Yes": 0.9998079216094166, "No": 0.00019166854612759636}, "ground_truth": 0}, {"key": "36281498", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9982551851623549, "res": {"Yes": 0.9982551851623549, "No": 0.0017440482283627276}, "ground_truth": 0}, {"key": "39558652", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.897711630873586, "res": {"Yes": 0.897711630873586, "No": 0.10228784809811277}, "ground_truth": 0}, {"key": "39558652", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5481704501376423, "res": {"Yes": 0.5481704501376423, "No": 0.4518287240746683}, "ground_truth": 0}, {"key": "39558652", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9543754896033192, "res": {"Yes": 0.9543754896033192, "No": 0.045624026695883085}, "ground_truth": 1}, {"key": "39558652", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6995554969475751, "res": {"Yes": 0.6995554969475751, "No": 0.30044381926692565}, "ground_truth": 0}, {"key": "39558652", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9511945625811546, "res": {"Yes": 0.9511945625811546, "No": 0.0488045857622539}, "ground_truth": 0}, {"key": "37330579", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.004860101288654388, "res": {"No": 0.9951391446812871, "Yes": 0.004860101288654388}, "ground_truth": 0}, {"key": "37330579", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.39067894454145535, "res": {"No": 0.6093180061337354, "Yes": 0.39067894454145535}, "ground_truth": 1}, {"key": "37330579", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7022154171442518, "res": {"Yes": 0.7022154171442518, "No": 0.2977828051468887}, "ground_truth": 0}, {"key": "37330579", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.2701860454641765, "res": {"No": 0.7298085350461591, "Yes": 0.2701860454641765}, "ground_truth": 0}, {"key": "40547658", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.06886810675015964, "res": {"No": 0.9311302343205816, "Yes": 0.06886810675015964}, "ground_truth": 0}, {"key": "40547658", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8703095117231356, "res": {"Yes": 0.8703095117231356, "No": 0.12968951906296836}, "ground_truth": 0}, {"key": "40547658", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8395092030394266, "res": {"Yes": 0.8395092030394266, "No": 0.1604861713399087}, "ground_truth": 1}, {"key": "40547658", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9832130940796343, "res": {"Yes": 0.9832130940796343, "No": 0.01678456608902272}, "ground_truth": 0}, {"key": "40547658", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.02362717373235131, "res": {"No": 0.9763690705430845, "Yes": 0.02362717373235131}, "ground_truth": 0}, {"key": "37119340", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0004176804046744666, "res": {"No": 0.9995821655371427, "Yes": 0.0004176804046744666}, "ground_truth": 0}, {"key": "37119340", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9863195575584882, "res": {"Yes": 0.9863195575584882, "No": 0.013679895578054723}, "ground_truth": 0}, {"key": "37119340", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9952162404004653, "res": {"Yes": 0.9952162404004653, "No": 0.00478346404182924}, "ground_truth": 1}, {"key": "37119340", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9972131597689947, "res": {"Yes": 0.9972131597689947, "No": 0.0027865778864237197}, "ground_truth": 0}, {"key": "37119340", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9931007443017406, "res": {"Yes": 0.9931007443017406, "No": 0.006896973408895246}, "ground_truth": 0}, {"key": "35301627", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6641843450167242, "res": {"Yes": 0.6641843450167242, "No": 0.33581505570843817}, "ground_truth": 0}, {"key": "35301627", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.050272282374038586, "res": {"No": 0.9497233854473661, "Yes": 0.050272282374038586}, "ground_truth": 0}, {"key": "35301627", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.995143500713399, "res": {"Yes": 0.995143500713399, "No": 0.004854915413231481}, "ground_truth": 1}, {"key": "35301627", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.04389373411296484, "res": {"No": 0.9560981087316038, "Yes": 0.04389373411296484}, "ground_truth": 0}, {"key": "35301627", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.1111646325903557, "res": {"No": 0.8888078131700313, "Yes": 0.1111646325903557}, "ground_truth": 0}, {"key": "34037168", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.08094158154536704, "res": {"No": 0.9190379799544939, "Yes": 0.08094158154536704}, "ground_truth": 0}, {"key": "34037168", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.997639987219422, "res": {"Yes": 0.997639987219422, "No": 0.0023594257873366027}, "ground_truth": 0}, {"key": "34037168", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9917937783858156, "res": {"Yes": 0.9917937783858156, "No": 0.0082031701152623}, "ground_truth": 1}, {"key": "34037168", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996844872846088, "res": {"Yes": 0.9996844872846088, "No": 0.0003144070732650245}, "ground_truth": 0}, {"key": "34037168", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.836105197068375, "res": {"Yes": 0.836105197068375, "No": 0.16381756154019508}, "ground_truth": 0}, {"key": "39703862", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9887274971962181, "res": {"Yes": 0.9887274971962181, "No": 0.011271644987026973}, "ground_truth": 0}, {"key": "39703862", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9942199982573088, "res": {"Yes": 0.9942199982573088, "No": 0.00577961619934461}, "ground_truth": 0}, {"key": "39703862", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7108621143381461, "res": {"Yes": 0.7108621143381461, "No": 0.2891358303715712}, "ground_truth": 1}, {"key": "39703862", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5976080946445468, "res": {"Yes": 0.5976080946445468, "No": 0.4023907288899176}, "ground_truth": 0}, {"key": "39703862", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9784972456692436, "res": {"Yes": 0.9784972456692436, "No": 0.02150210159545052}, "ground_truth": 0}, {"key": "16554814", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0015721685038112686, "res": {"No": 0.9984221097798359, "Yes": 0.0015721685038112686}, "ground_truth": 0}, {"key": "16554814", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5115831068772562, "res": {"Yes": 0.5115831068772562, "No": 0.48836089867185556}, "ground_truth": 0}, {"key": "16554814", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6207765156504378, "res": {"Yes": 0.6207765156504378, "No": 0.3792183949077537}, "ground_truth": 1}, {"key": "16554814", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.006901249478031016, "res": {"No": 0.9930950981428193, "Yes": 0.006901249478031016}, "ground_truth": 0}, {"key": "16554814", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9686877639914686, "res": {"Yes": 0.9686877639914686, "No": 0.031309459708149835}, "ground_truth": 0}, {"key": "32983099", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9909156711254545, "res": {"Yes": 0.9909156711254545, "No": 0.009083646228136398}, "ground_truth": 0}, {"key": "32983099", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998808482291361, "res": {"Yes": 0.9998808482291361, "No": 0.00011864662743147158}, "ground_truth": 0}, {"key": "32983099", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997398900344643, "res": {"Yes": 0.9997398900344643, "No": 0.0002596367549873722}, "ground_truth": 1}, {"key": "32983099", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995148678646674, "res": {"Yes": 0.9995148678646674, "No": 0.0004848657545906287}, "ground_truth": 0}, {"key": "32983099", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9952856638320268, "res": {"Yes": 0.9952856638320268, "No": 0.0047141248022951115}, "ground_truth": 0}, {"key": "41072994", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8764777850566974, "res": {"Yes": 0.8764777850566974, "No": 0.12351919622161972}, "ground_truth": 0}, {"key": "41072994", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.18052281686026986, "res": {"No": 0.819449340730042, "Yes": 0.18052281686026986}, "ground_truth": 0}, {"key": "41072994", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4050354033569315, "res": {"No": 0.5949383453893048, "Yes": 0.4050354033569315}, "ground_truth": 1}, {"key": "41072994", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.16735827588383057, "res": {"No": 0.8326344988473342, "Yes": 0.16735827588383057}, "ground_truth": 0}, {"key": "41072994", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.020714562989633895, "res": {"No": 0.9792345616933424, "Yes": 0.020714562989633895}, "ground_truth": 0}, {"key": "38396247", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.001173455692613465, "res": {"No": 0.9988262991262985, "Yes": 0.001173455692613465}, "ground_truth": 0}, {"key": "38396247", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9973102606484867, "res": {"Yes": 0.9973102606484867, "No": 0.0026893358816346127}, "ground_truth": 0}, {"key": "38396247", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997752702855062, "res": {"Yes": 0.9997752702855062, "No": 0.00022456687745980863}, "ground_truth": 1}, {"key": "38396247", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998679679990438, "res": {"Yes": 0.998679679990438, "No": 0.00132029576907786}, "ground_truth": 0}, {"key": "38396247", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999684368122225, "res": {"Yes": 0.999684368122225, "No": 0.0003154258270928963}, "ground_truth": 0}, {"key": "37507998", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 6.153700763231212e-07, "res": {"No": 0.9999992103693117, "Yes": 6.153700763231212e-07}, "ground_truth": 0}, {"key": "37507998", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.21207680122177355, "res": {"No": 0.7878768130197463, "Yes": 0.21207680122177355}, "ground_truth": 0}, {"key": "37507998", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3023632711169399, "res": {"No": 0.6975394344771242, "Yes": 0.3023632711169399}, "ground_truth": 1}, {"key": "37507998", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.24297862560101244, "res": {"No": 0.7570122601266085, "Yes": 0.24297862560101244}, "ground_truth": 0}, {"key": "37507998", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.001888702865655808, "res": {"No": 0.9981106376962937, "Yes": 0.001888702865655808}, "ground_truth": 0}, {"key": "32593929", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9952224954537147, "res": {"Yes": 0.9952224954537147, "No": 0.004773850819917562}, "ground_truth": 0}, {"key": "32593929", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9969405825848343, "res": {"Yes": 0.9969405825848343, "No": 0.0030588865554587253}, "ground_truth": 0}, {"key": "32593929", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9983568749105903, "res": {"Yes": 0.9983568749105903, "No": 0.0016421587364492604}, "ground_truth": 1}, {"key": "32593929", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9971876723235623, "res": {"Yes": 0.9971876723235623, "No": 0.002809948846204128}, "ground_truth": 0}, {"key": "32593929", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.995965025474028, "res": {"Yes": 0.995965025474028, "No": 0.004034448764901491}, "ground_truth": 0}, {"key": "36056449", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999565364005696, "res": {"Yes": 0.9999565364005696, "No": 4.324884630374895e-05}, "ground_truth": 0}, {"key": "36056449", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999775151112301, "res": {"Yes": 0.999775151112301, "No": 0.0002239006793941373}, "ground_truth": 0}, {"key": "36056449", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999814491960682, "res": {"Yes": 0.9999814491960682, "No": 1.841047061567718e-05}, "ground_truth": 1}, {"key": "36056449", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999583243784529, "res": {"Yes": 0.9999583243784529, "No": 4.098132839452119e-05}, "ground_truth": 0}, {"key": "36056449", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999987886094374, "res": {"Yes": 0.999987886094374, "No": 1.1863477439426888e-05}, "ground_truth": 0}, {"key": "21986185", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7919459456015312, "res": {"Yes": 0.7919459456015312, "No": 0.20804422535138273}, "ground_truth": 0}, {"key": "21986185", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9985636588268085, "res": {"Yes": 0.9985636588268085, "No": 0.0014360001555993752}, "ground_truth": 0}, {"key": "21986185", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9908839484589466, "res": {"Yes": 0.9908839484589466, "No": 0.009115463699605815}, "ground_truth": 1}, {"key": "21986185", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9897903044263018, "res": {"Yes": 0.9897903044263018, "No": 0.010209243944879287}, "ground_truth": 0}, {"key": "21986185", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9845819491569697, "res": {"Yes": 0.9845819491569697, "No": 0.015417417533533618}, "ground_truth": 0}, {"key": "40757465", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9070928895986475, "res": {"Yes": 0.9070928895986475, "No": 0.0929060696490543}, "ground_truth": 0}, {"key": "40757465", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9234110521569411, "res": {"Yes": 0.9234110521569411, "No": 0.07658642019511638}, "ground_truth": 0}, {"key": "40757465", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.989378784709789, "res": {"Yes": 0.989378784709789, "No": 0.010620714358872569}, "ground_truth": 1}, {"key": "40757465", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.991289559627158, "res": {"Yes": 0.991289559627158, "No": 0.008709798697831632}, "ground_truth": 0}, {"key": "40757465", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8511049606501442, "res": {"Yes": 0.8511049606501442, "No": 0.14889335016909885}, "ground_truth": 0}, {"key": "35198313", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9967709494338822, "res": {"Yes": 0.9967709494338822, "No": 0.003227986857465029}, "ground_truth": 0}, {"key": "35198313", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9892674720074423, "res": {"Yes": 0.9892674720074423, "No": 0.01073142420521299}, "ground_truth": 0}, {"key": "35198313", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9968838320614619, "res": {"Yes": 0.9968838320614619, "No": 0.0031151873004344}, "ground_truth": 1}, {"key": "35198313", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9974690443826592, "res": {"Yes": 0.9974690443826592, "No": 0.0025302909066174054}, "ground_truth": 0}, {"key": "35198313", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9908283525112136, "res": {"Yes": 0.9908283525112136, "No": 0.009171036201725734}, "ground_truth": 0}, {"key": "30604618", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0929688210097567, "res": {"No": 0.907030701441971, "Yes": 0.0929688210097567}, "ground_truth": 0}, {"key": "30604618", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9934636991570313, "res": {"Yes": 0.9934636991570313, "No": 0.00653619556935595}, "ground_truth": 0}, {"key": "30604618", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9946242210939893, "res": {"Yes": 0.9946242210939893, "No": 0.0053750951650476525}, "ground_truth": 1}, {"key": "30604618", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9693576920136537, "res": {"Yes": 0.9693576920136537, "No": 0.030642011095120127}, "ground_truth": 0}, {"key": "30604618", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8969392185796281, "res": {"Yes": 0.8969392185796281, "No": 0.10305837538342216}, "ground_truth": 0}, {"key": "35779006", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9933023012411949, "res": {"Yes": 0.9933023012411949, "No": 0.006697007460825296}, "ground_truth": 0}, {"key": "35779006", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9984320888590081, "res": {"Yes": 0.9984320888590081, "No": 0.0015677465643441422}, "ground_truth": 0}, {"key": "35779006", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992686511660225, "res": {"Yes": 0.9992686511660225, "No": 0.0007311938124833331}, "ground_truth": 1}, {"key": "35779006", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9936840118382694, "res": {"Yes": 0.9936840118382694, "No": 0.0063158937821236475}, "ground_truth": 0}, {"key": "35779006", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9987419889601543, "res": {"Yes": 0.9987419889601543, "No": 0.0012578391381311625}, "ground_truth": 0}, {"key": "33858956", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.738182422475997, "res": {"Yes": 0.738182422475997, "No": 0.2618140918968075}, "ground_truth": 0}, {"key": "33858956", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7769289610611022, "res": {"Yes": 0.7769289610611022, "No": 0.223049468563457}, "ground_truth": 0}, {"key": "33858956", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9209472638772938, "res": {"Yes": 0.9209472638772938, "No": 0.07904970082213829}, "ground_truth": 1}, {"key": "33858956", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9431427087151129, "res": {"Yes": 0.9431427087151129, "No": 0.05685377830751037}, "ground_truth": 0}, {"key": "33858956", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9968939036296937, "res": {"Yes": 0.9968939036296937, "No": 0.003105821578642846}, "ground_truth": 0}, {"key": "38633880", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6732164374998789, "res": {"Yes": 0.6732164374998789, "No": 0.3267829467125456}, "ground_truth": 0}, {"key": "38633880", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9949316429861151, "res": {"Yes": 0.9949316429861151, "No": 0.0050669359154637975}, "ground_truth": 0}, {"key": "38633880", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997921898755158, "res": {"Yes": 0.9997921898755158, "No": 0.00020700036529299574}, "ground_truth": 1}, {"key": "38633880", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998275139883994, "res": {"Yes": 0.998275139883994, "No": 0.0017244150283689153}, "ground_truth": 0}, {"key": "38633880", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9908490734257978, "res": {"Yes": 0.9908490734257978, "No": 0.009146838303579667}, "ground_truth": 0}, {"key": "36654905", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9485442339562127, "res": {"Yes": 0.9485442339562127, "No": 0.05145568639853716}, "ground_truth": 0}, {"key": "36654905", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9957679373236303, "res": {"Yes": 0.9957679373236303, "No": 0.00423158564157782}, "ground_truth": 0}, {"key": "36654905", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9859518502398859, "res": {"Yes": 0.9859518502398859, "No": 0.01404583315200258}, "ground_truth": 1}, {"key": "36654905", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9673696227560608, "res": {"Yes": 0.9673696227560608, "No": 0.03262992718221975}, "ground_truth": 0}, {"key": "36654905", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9702287485880495, "res": {"Yes": 0.9702287485880495, "No": 0.029770425831769573}, "ground_truth": 0}, {"key": "26547482", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4553958218846939, "res": {"No": 0.544603049083689, "Yes": 0.4553958218846939}, "ground_truth": 0}, {"key": "26547482", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.986722949052908, "res": {"Yes": 0.986722949052908, "No": 0.013276379501535675}, "ground_truth": 0}, {"key": "26547482", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9515368106750339, "res": {"Yes": 0.9515368106750339, "No": 0.048462169292305776}, "ground_truth": 1}, {"key": "26547482", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9125185271550927, "res": {"Yes": 0.9125185271550927, "No": 0.08747891378276758}, "ground_truth": 0}, {"key": "26547482", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9695208127701941, "res": {"Yes": 0.9695208127701941, "No": 0.03047695057258227}, "ground_truth": 0}, {"key": "36439068", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996014650261688, "res": {"Yes": 0.9996014650261688, "No": 0.0003980838087893479}, "ground_truth": 0}, {"key": "36439068", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.35964012510639354, "res": {"No": 0.6403554795688692, "Yes": 0.35964012510639354}, "ground_truth": 0}, {"key": "36439068", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9951465741193325, "res": {"Yes": 0.9951465741193325, "No": 0.004850969971040093}, "ground_truth": 1}, {"key": "36439068", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.99719633163975, "res": {"Yes": 0.99719633163975, "No": 0.0028032172599784123}, "ground_truth": 0}, {"key": "36439068", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.997618153309117, "res": {"Yes": 0.997618153309117, "No": 0.0023814738934812736}, "ground_truth": 0}, {"key": "30501258", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.39590784874385354, "res": {"No": 0.6040444264663691, "Yes": 0.39590784874385354}, "ground_truth": 0}, {"key": "30501258", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.566223388112551, "res": {"Yes": 0.566223388112551, "No": 0.4337660697466852}, "ground_truth": 0}, {"key": "30501258", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9813222009563297, "res": {"Yes": 0.9813222009563297, "No": 0.018666515036364337}, "ground_truth": 1}, {"key": "30501258", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5970933933813193, "res": {"Yes": 0.5970933933813193, "No": 0.4028993097462015}, "ground_truth": 0}, {"key": "30501258", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5542160645806434, "res": {"Yes": 0.5542160645806434, "No": 0.44572961285921864}, "ground_truth": 0}, {"key": "37560941", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.02546512525361745, "res": {"No": 0.9745338820386438, "Yes": 0.02546512525361745}, "ground_truth": 0}, {"key": "37560941", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.989968904443327, "res": {"Yes": 0.989968904443327, "No": 0.010030826275425762}, "ground_truth": 0}, {"key": "37560941", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.99820469379362, "res": {"Yes": 0.99820469379362, "No": 0.001795219464805487}, "ground_truth": 1}, {"key": "37560941", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997060529109136, "res": {"Yes": 0.9997060529109136, "No": 0.00029352918083784833}, "ground_truth": 0}, {"key": "37560941", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9974418895552825, "res": {"Yes": 0.9974418895552825, "No": 0.002557899154949474}, "ground_truth": 0}, {"key": "36801665", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6364250507998048, "res": {"Yes": 0.6364250507998048, "No": 0.36357150094135654}, "ground_truth": 0}, {"key": "36801665", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.991304907882228, "res": {"Yes": 0.991304907882228, "No": 0.008690283643664028}, "ground_truth": 0}, {"key": "36801665", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9867498820233684, "res": {"Yes": 0.9867498820233684, "No": 0.01324441930236866}, "ground_truth": 1}, {"key": "36801665", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.11199460259100663, "res": {"No": 0.8880044186900844, "Yes": 0.11199460259100663}, "ground_truth": 0}, {"key": "36801665", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9562491487862095, "res": {"Yes": 0.9562491487862095, "No": 0.043741354374672095}, "ground_truth": 0}, {"key": "34954610", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4935204412469309, "res": {"No": 0.5064762939708878, "Yes": 0.4935204412469309}, "ground_truth": 0}, {"key": "34954610", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9977682580474758, "res": {"Yes": 0.9977682580474758, "No": 0.0022313950637139726}, "ground_truth": 0}, {"key": "34954610", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995228506919551, "res": {"Yes": 0.9995228506919551, "No": 0.00047669198948299603}, "ground_truth": 1}, {"key": "34954610", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.87204073649529, "res": {"Yes": 0.87204073649529, "No": 0.12795140955311665}, "ground_truth": 0}, {"key": "34954610", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995332128190508, "res": {"Yes": 0.9995332128190508, "No": 0.00046541806117296567}, "ground_truth": 0}, {"key": "37020510", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9921893498966486, "res": {"Yes": 0.9921893498966486, "No": 0.007809346448516105}, "ground_truth": 0}, {"key": "37020510", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9944123463338806, "res": {"Yes": 0.9944123463338806, "No": 0.005584507684184545}, "ground_truth": 0}, {"key": "37020510", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9098812568167254, "res": {"Yes": 0.9098812568167254, "No": 0.09011450856255498}, "ground_truth": 1}, {"key": "37020510", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9973065789847242, "res": {"Yes": 0.9973065789847242, "No": 0.0026930936241835743}, "ground_truth": 0}, {"key": "37020510", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9766972638068195, "res": {"Yes": 0.9766972638068195, "No": 0.023299683551113178}, "ground_truth": 0}, {"key": "38064637", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9976300162566337, "res": {"Yes": 0.9976300162566337, "No": 0.0023688894977424765}, "ground_truth": 0}, {"key": "38064637", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996634024416733, "res": {"Yes": 0.9996634024416733, "No": 0.0003363990681280384}, "ground_truth": 0}, {"key": "38064637", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996624491131241, "res": {"Yes": 0.9996624491131241, "No": 0.0003372673563016675}, "ground_truth": 1}, {"key": "38064637", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998375943892193, "res": {"Yes": 0.9998375943892193, "No": 0.0001621841726933527}, "ground_truth": 0}, {"key": "38064637", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9981454296447854, "res": {"Yes": 0.9981454296447854, "No": 0.0018543788328472303}, "ground_truth": 0}, {"key": "40886108", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.025775295101703465, "res": {"No": 0.974224328620138, "Yes": 0.025775295101703465}, "ground_truth": 0}, {"key": "40886108", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.987511531309101, "res": {"Yes": 0.987511531309101, "No": 0.012487971224796507}, "ground_truth": 0}, {"key": "40886108", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.987096118294425, "res": {"Yes": 0.987096118294425, "No": 0.012903495955851205}, "ground_truth": 1}, {"key": "40886108", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9171671813352834, "res": {"Yes": 0.9171671813352834, "No": 0.08283191872715279}, "ground_truth": 0}, {"key": "40886108", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9872360944994132, "res": {"Yes": 0.9872360944994132, "No": 0.012763058952198095}, "ground_truth": 0}, {"key": "38554603", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.964555119505695, "res": {"Yes": 0.964555119505695, "No": 0.035444481786374146}, "ground_truth": 0}, {"key": "38554603", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9964900832094795, "res": {"Yes": 0.9964900832094795, "No": 0.003509767440384923}, "ground_truth": 0}, {"key": "38554603", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9863781318846148, "res": {"Yes": 0.9863781318846148, "No": 0.013621606958702933}, "ground_truth": 1}, {"key": "38554603", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990896662054474, "res": {"Yes": 0.9990896662054474, "No": 0.0009098225295001974}, "ground_truth": 0}, {"key": "38554603", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9972037907959278, "res": {"Yes": 0.9972037907959278, "No": 0.0027961159094936376}, "ground_truth": 0}, {"key": "39115586", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9918884129202034, "res": {"Yes": 0.9918884129202034, "No": 0.008111528155988623}, "ground_truth": 0}, {"key": "39115586", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994724857845738, "res": {"Yes": 0.9994724857845738, "No": 0.0005273816911231863}, "ground_truth": 0}, {"key": "39115586", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9986065681289865, "res": {"Yes": 0.9986065681289865, "No": 0.0013931590676502963}, "ground_truth": 1}, {"key": "39115586", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999962302846054, "res": {"Yes": 0.9999962302846054, "No": 3.6913511559886364e-06}, "ground_truth": 0}, {"key": "39115586", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9983016219790176, "res": {"Yes": 0.9983016219790176, "No": 0.0016982884995819431}, "ground_truth": 0}, {"key": "38786314", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9143736222278729, "res": {"Yes": 0.9143736222278729, "No": 0.08562294351767438}, "ground_truth": 0}, {"key": "38786314", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990165024510502, "res": {"Yes": 0.9990165024510502, "No": 0.000981378835658546}, "ground_truth": 0}, {"key": "38786314", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9981897267248299, "res": {"Yes": 0.9981897267248299, "No": 0.0018077198124706827}, "ground_truth": 1}, {"key": "38786314", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9967315042001876, "res": {"Yes": 0.9967315042001876, "No": 0.003267091955462686}, "ground_truth": 0}, {"key": "38786314", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988779155081291, "res": {"Yes": 0.9988779155081291, "No": 0.0011189699548643417}, "ground_truth": 0}, {"key": "38721078", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.510614355299422, "res": {"Yes": 0.510614355299422, "No": 0.48937936144545097}, "ground_truth": 0}, {"key": "38721078", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.989749420002609, "res": {"Yes": 0.989749420002609, "No": 0.010245845219612786}, "ground_truth": 0}, {"key": "38721078", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9983568749105903, "res": {"Yes": 0.9983568749105903, "No": 0.0016417328157173326}, "ground_truth": 1}, {"key": "38721078", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9171393182195573, "res": {"Yes": 0.9171393182195573, "No": 0.08285090597878093}, "ground_truth": 0}, {"key": "38721078", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.005966683700352086, "res": {"No": 0.9940088817532903, "Yes": 0.005966683700352086}, "ground_truth": 0}, {"key": "39475467", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.999892767243843, "res": {"Yes": 0.999892767243843, "No": 0.00010706782990518575}, "ground_truth": 0}, {"key": "39475467", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998794179605985, "res": {"Yes": 0.9998794179605985, "No": 0.00012037484204956394}, "ground_truth": 0}, {"key": "39475467", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990965701387126, "res": {"Yes": 0.9990965701387126, "No": 0.0009031205626538539}, "ground_truth": 1}, {"key": "39475467", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995122466503585, "res": {"Yes": 0.9995122466503585, "No": 0.00048753718183697177}, "ground_truth": 0}, {"key": "39475467", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998833512079994, "res": {"Yes": 0.9998833512079994, "No": 0.000116509353573138}, "ground_truth": 0}, {"key": "35691234", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.01746544362926739, "res": {"No": 0.9825341201044883, "Yes": 0.01746544362926739}, "ground_truth": 0}, {"key": "35691234", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9934731147538581, "res": {"Yes": 0.9934731147538581, "No": 0.00652664206475555}, "ground_truth": 0}, {"key": "35691234", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996871089606144, "res": {"Yes": 0.9996871089606144, "No": 0.00031272010522391026}, "ground_truth": 1}, {"key": "35691234", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999563108434926, "res": {"Yes": 0.999563108434926, "No": 0.00043670615640974857}, "ground_truth": 0}, {"key": "35691234", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995612020000143, "res": {"Yes": 0.9995612020000143, "No": 0.00043863716063478046}, "ground_truth": 0}, {"key": "36871390", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4496905947152574, "res": {"No": 0.5503086369802862, "Yes": 0.4496905947152574}, "ground_truth": 0}, {"key": "36871390", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8046052455798042, "res": {"Yes": 0.8046052455798042, "No": 0.19539193783989908}, "ground_truth": 0}, {"key": "36871390", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9934789996092828, "res": {"Yes": 0.9934789996092828, "No": 0.006520410140743529}, "ground_truth": 1}, {"key": "36871390", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9822590362932344, "res": {"Yes": 0.9822590362932344, "No": 0.01774018276020789}, "ground_truth": 0}, {"key": "36871390", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.39968881385849675, "res": {"No": 0.6003084575207989, "Yes": 0.39968881385849675}, "ground_truth": 0}, {"key": "31730844", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9705546216391152, "res": {"Yes": 0.9705546216391152, "No": 0.029444925285927875}, "ground_truth": 0}, {"key": "31730844", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9958146347568223, "res": {"Yes": 0.9958146347568223, "No": 0.00418497143764279}, "ground_truth": 0}, {"key": "31730844", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9908153618458443, "res": {"Yes": 0.9908153618458443, "No": 0.009184320889100645}, "ground_truth": 1}, {"key": "31730844", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9883436606981624, "res": {"Yes": 0.9883436606981624, "No": 0.011654586330533756}, "ground_truth": 0}, {"key": "31730844", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5857755109018377, "res": {"Yes": 0.5857755109018377, "No": 0.41422035015445224}, "ground_truth": 0}, {"key": "30810940", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9820064170253395, "res": {"Yes": 0.9820064170253395, "No": 0.01799314188637175}, "ground_truth": 0}, {"key": "30810940", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.988261807489166, "res": {"Yes": 0.988261807489166, "No": 0.011734007843928976}, "ground_truth": 0}, {"key": "30810940", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9925032523492144, "res": {"Yes": 0.9925032523492144, "No": 0.007493571944533828}, "ground_truth": 1}, {"key": "30810940", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9973537710528689, "res": {"Yes": 0.9973537710528689, "No": 0.0026451320249570058}, "ground_truth": 0}, {"key": "30810940", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9991658241183089, "res": {"Yes": 0.9991658241183089, "No": 0.0008334265350249541}, "ground_truth": 0}, {"key": "39352003", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9655925641350072, "res": {"Yes": 0.9655925641350072, "No": 0.03440666442781343}, "ground_truth": 0}, {"key": "39352003", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8677569717399758, "res": {"Yes": 0.8677569717399758, "No": 0.13224137867125588}, "ground_truth": 0}, {"key": "39352003", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9609721266106183, "res": {"Yes": 0.9609721266106183, "No": 0.03902708057891955}, "ground_truth": 1}, {"key": "39352003", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9832090619310033, "res": {"Yes": 0.9832090619310033, "No": 0.016789817122514185}, "ground_truth": 0}, {"key": "39352003", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9975022570638767, "res": {"Yes": 0.9975022570638767, "No": 0.002497444175109227}, "ground_truth": 0}, {"key": "40118123", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.004457653823075822, "res": {"No": 0.9955421040475926, "Yes": 0.004457653823075822}, "ground_truth": 0}, {"key": "40118123", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999900037916542, "res": {"Yes": 0.999900037916542, "No": 9.974296809175156e-05}, "ground_truth": 0}, {"key": "40118123", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996475574924574, "res": {"Yes": 0.9996475574924574, "No": 0.00035238296677081606}, "ground_truth": 1}, {"key": "40118123", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999740587314805, "res": {"Yes": 0.9999740587314805, "No": 2.56189819197481e-05}, "ground_truth": 0}, {"key": "40118123", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996796051573934, "res": {"Yes": 0.9996796051573934, "No": 0.00031969664377456063}, "ground_truth": 0}, {"key": "37114191", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9990684894855352, "res": {"Yes": 0.9990684894855352, "No": 0.0009314497636246194}, "ground_truth": 0}, {"key": "37114191", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990960937396086, "res": {"Yes": 0.9990960937396086, "No": 0.0009037543239943561}, "ground_truth": 0}, {"key": "37114191", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997986255585553, "res": {"Yes": 0.9997986255585553, "No": 0.0002013175592224131}, "ground_truth": 1}, {"key": "37114191", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999129107124922, "res": {"Yes": 0.9999129107124922, "No": 8.69105612244325e-05}, "ground_truth": 0}, {"key": "37114191", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995881232445286, "res": {"Yes": 0.9995881232445286, "No": 0.0004116858497800491}, "ground_truth": 0}, {"key": "39268203", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0003005014436021655, "res": {"No": 0.9996984261325432, "Yes": 0.0003005014436021655}, "ground_truth": 0}, {"key": "39268203", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6481774548777355, "res": {"Yes": 0.6481774548777355, "No": 0.35181292771908323}, "ground_truth": 0}, {"key": "39268203", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1400542544021248, "res": {"No": 0.8599448411407128, "Yes": 0.1400542544021248}, "ground_truth": 1}, {"key": "39268203", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.42180097475454814, "res": {"No": 0.5781986408846145, "Yes": 0.42180097475454814}, "ground_truth": 0}, {"key": "39268203", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.41167190251875924, "res": {"No": 0.5883176828645754, "Yes": 0.41167190251875924}, "ground_truth": 0}, {"key": "37950968", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9873456739145389, "res": {"Yes": 0.9873456739145389, "No": 0.012653986185097244}, "ground_truth": 0}, {"key": "37950968", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9912229214351572, "res": {"Yes": 0.9912229214351572, "No": 0.008776715764723868}, "ground_truth": 0}, {"key": "37950968", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9963693567811823, "res": {"Yes": 0.9963693567811823, "No": 0.0036297445684478962}, "ground_truth": 1}, {"key": "37950968", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9984178289543753, "res": {"Yes": 0.9984178289543753, "No": 0.001581497177370688}, "ground_truth": 0}, {"key": "37950968", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9861033326724357, "res": {"Yes": 0.9861033326724357, "No": 0.013896300852258873}, "ground_truth": 0}, {"key": "34959807", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9998143573937215, "res": {"Yes": 0.9998143573937215, "No": 0.00018545820709121462}, "ground_truth": 0}, {"key": "34959807", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999268564151225, "res": {"Yes": 0.9999268564151225, "No": 7.242492861135442e-05}, "ground_truth": 0}, {"key": "34959807", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998278213244498, "res": {"Yes": 0.9998278213244498, "No": 0.0001712393966690354}, "ground_truth": 1}, {"key": "34959807", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998554685256801, "res": {"Yes": 0.9998554685256801, "No": 0.00014360084743638205}, "ground_truth": 0}, {"key": "34959807", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998535615431577, "res": {"Yes": 0.9998535615431577, "No": 0.00014583247887423238}, "ground_truth": 0}, {"key": "35631314", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0002670045122217219, "res": {"No": 0.9997328588885428, "Yes": 0.0002670045122217219}, "ground_truth": 0}, {"key": "35631314", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999387759842665, "res": {"Yes": 0.9999387759842665, "No": 6.102890216609664e-05}, "ground_truth": 0}, {"key": "35631314", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999701251202631, "res": {"Yes": 0.9999701251202631, "No": 2.9622451130484337e-05}, "ground_truth": 1}, {"key": "35631314", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999046864026295, "res": {"Yes": 0.9999046864026295, "No": 9.513838900422718e-05}, "ground_truth": 0}, {"key": "35631314", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999731051276736, "res": {"Yes": 0.9999731051276736, "No": 2.664121780329523e-05}, "ground_truth": 0}, {"key": "38082365", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9919824900622232, "res": {"Yes": 0.9919824900622232, "No": 0.008016931791023403}, "ground_truth": 0}, {"key": "38082365", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991978417011235, "res": {"Yes": 0.9991978417011235, "No": 0.0008014630404127906}, "ground_truth": 0}, {"key": "38082365", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9889789358687907, "res": {"Yes": 0.9889789358687907, "No": 0.011020523189755384}, "ground_truth": 1}, {"key": "38082365", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9950288880787758, "res": {"Yes": 0.9950288880787758, "No": 0.004970916745740967}, "ground_truth": 0}, {"key": "38082365", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9664438096460308, "res": {"Yes": 0.9664438096460308, "No": 0.03355583201902032}, "ground_truth": 0}, {"key": "37242829", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996100369353691, "res": {"Yes": 0.9996100369353691, "No": 0.0003891029875110613}, "ground_truth": 0}, {"key": "37242829", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.990331084474712, "res": {"Yes": 0.990331084474712, "No": 0.00965575083193965}, "ground_truth": 0}, {"key": "37242829", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9951670013046504, "res": {"Yes": 0.9951670013046504, "No": 0.004830240594656396}, "ground_truth": 1}, {"key": "37242829", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9985224139068429, "res": {"Yes": 0.9985224139068429, "No": 0.00145293882184245}, "ground_truth": 0}, {"key": "37242829", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9821881943972319, "res": {"Yes": 0.9821881943972319, "No": 0.017796036767256315}, "ground_truth": 0}, {"key": "38556068", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6464205828512181, "res": {"Yes": 0.6464205828512181, "No": 0.3535774580886653}, "ground_truth": 0}, {"key": "38556068", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997516845353897, "res": {"Yes": 0.9997516845353897, "No": 0.00024795730100246176}, "ground_truth": 0}, {"key": "38556068", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.996475405018659, "res": {"Yes": 0.996475405018659, "No": 0.0035235333507801577}, "ground_truth": 1}, {"key": "38556068", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997926665865435, "res": {"Yes": 0.9997926665865435, "No": 0.00020655248772827707}, "ground_truth": 0}, {"key": "38556068", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999254260847726, "res": {"Yes": 0.9999254260847726, "No": 7.382235196942103e-05}, "ground_truth": 0}, {"key": "32969336", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.009786714268188914, "res": {"No": 0.9902126707345448, "Yes": 0.009786714268188914}, "ground_truth": 0}, {"key": "32969336", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999238765575363, "res": {"Yes": 0.9999238765575363, "No": 7.595488593881515e-05}, "ground_truth": 0}, {"key": "32969336", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993936543718529, "res": {"Yes": 0.9993936543718529, "No": 0.0006060694345458935}, "ground_truth": 1}, {"key": "32969336", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997571555714829, "res": {"Yes": 0.9997571555714829, "No": 0.0002423070098747545}, "ground_truth": 0}, {"key": "32969336", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999058783297223, "res": {"Yes": 0.9999058783297223, "No": 9.385523650042908e-05}, "ground_truth": 0}, {"key": "36825153", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9539290169641955, "res": {"Yes": 0.9539290169641955, "No": 0.046070055285613906}, "ground_truth": 0}, {"key": "36825153", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9894737854639049, "res": {"Yes": 0.9894737854639049, "No": 0.010525493627904444}, "ground_truth": 0}, {"key": "36825153", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9787634859731446, "res": {"Yes": 0.9787634859731446, "No": 0.021236221370754288}, "ground_truth": 1}, {"key": "36825153", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.99797456127495, "res": {"Yes": 0.99797456127495, "No": 0.002025396085039441}, "ground_truth": 0}, {"key": "36825153", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9799299602541282, "res": {"Yes": 0.9799299602541282, "No": 0.020069747444199044}, "ground_truth": 0}, {"key": "41050146", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5234346758155848, "res": {"Yes": 0.5234346758155848, "No": 0.476558163180082}, "ground_truth": 0}, {"key": "41050146", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9970892906525046, "res": {"Yes": 0.9970892906525046, "No": 0.0029101059195219287}, "ground_truth": 0}, {"key": "41050146", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.997924224907163, "res": {"Yes": 0.997924224907163, "No": 0.002075149665393677}, "ground_truth": 1}, {"key": "41050146", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9964270026007337, "res": {"Yes": 0.9964270026007337, "No": 0.0035716725196498727}, "ground_truth": 0}, {"key": "41050146", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7250821066413699, "res": {"Yes": 0.7250821066413699, "No": 0.27491528041429447}, "ground_truth": 0}, {"key": "27865037", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9717102234423549, "res": {"Yes": 0.9717102234423549, "No": 0.028289261461526737}, "ground_truth": 0}, {"key": "27865037", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999914621674475, "res": {"Yes": 0.9999914621674475, "No": 8.467070304367985e-06}, "ground_truth": 0}, {"key": "27865037", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999437822452772, "res": {"Yes": 0.9999437822452772, "No": 5.6124843518209817e-05}, "ground_truth": 1}, {"key": "27865037", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999916486517445, "res": {"Yes": 0.999916486517445, "No": 8.345608438241603e-05}, "ground_truth": 0}, {"key": "27865037", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9980951962456861, "res": {"Yes": 0.9980951962456861, "No": 0.001904678597234457}, "ground_truth": 0}, {"key": "39868565", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9674348895166485, "res": {"Yes": 0.9674348895166485, "No": 0.03256385982108721}, "ground_truth": 0}, {"key": "39868565", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9462176314517213, "res": {"Yes": 0.9462176314517213, "No": 0.053780931915519636}, "ground_truth": 0}, {"key": "39868565", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4425904626769906, "res": {"No": 0.5574054758878701, "Yes": 0.4425904626769906}, "ground_truth": 1}, {"key": "39868565", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8443980604221587, "res": {"Yes": 0.8443980604221587, "No": 0.15559965258259664}, "ground_truth": 0}, {"key": "39868565", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.4273523074270459, "res": {"No": 0.5726399037761143, "Yes": 0.4273523074270459}, "ground_truth": 0}, {"key": "37761968", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9623982198712195, "res": {"Yes": 0.9623982198712195, "No": 0.03760044099743057}, "ground_truth": 0}, {"key": "37761968", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8843161186371158, "res": {"Yes": 0.8843161186371158, "No": 0.11568239698056558}, "ground_truth": 0}, {"key": "37761968", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997409589369314, "res": {"Yes": 0.9997409589369314, "No": 0.0002585992478957112}, "ground_truth": 1}, {"key": "37761968", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999040904456155, "res": {"Yes": 0.9999040904456155, "No": 9.582930711409745e-05}, "ground_truth": 0}, {"key": "37761968", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.996324511703853, "res": {"Yes": 0.996324511703853, "No": 0.00367462203215424}, "ground_truth": 0}, {"key": "16326139", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9398304916603916, "res": {"Yes": 0.9398304916603916, "No": 0.06016896446816098}, "ground_truth": 0}, {"key": "16326139", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9358668003028026, "res": {"Yes": 0.9358668003028026, "No": 0.06413268747663424}, "ground_truth": 0}, {"key": "16326139", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8746004722870284, "res": {"Yes": 0.8746004722870284, "No": 0.12539876491431023}, "ground_truth": 1}, {"key": "16326139", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.27257643739798515, "res": {"No": 0.7274211068568566, "Yes": 0.27257643739798515}, "ground_truth": 0}, {"key": "16326139", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9177356158546407, "res": {"Yes": 0.9177356158546407, "No": 0.082261794618531}, "ground_truth": 0}, {"key": "36568381", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996052706661307, "res": {"Yes": 0.9996052706661307, "No": 0.0003941775955881401}, "ground_truth": 0}, {"key": "36568381", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9944063301573843, "res": {"Yes": 0.9944063301573843, "No": 0.005590122935598358}, "ground_truth": 0}, {"key": "36568381", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9873746075161003, "res": {"Yes": 0.9873746075161003, "No": 0.012622630558111055}, "ground_truth": 1}, {"key": "36568381", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8604565401084486, "res": {"Yes": 0.8604565401084486, "No": 0.13953055073688328}, "ground_truth": 0}, {"key": "36568381", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999805776363853, "res": {"Yes": 0.999805776363853, "No": 0.00019334314391334525}, "ground_truth": 0}, {"key": "39855613", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9965049989839739, "res": {"Yes": 0.9965049989839739, "No": 0.003494576792645815}, "ground_truth": 0}, {"key": "39855613", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9939082977163044, "res": {"Yes": 0.9939082977163044, "No": 0.006087930952869267}, "ground_truth": 0}, {"key": "39855613", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7976069075127146, "res": {"Yes": 0.7976069075127146, "No": 0.202391811379181}, "ground_truth": 1}, {"key": "39855613", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9956809513340913, "res": {"Yes": 0.9956809513340913, "No": 0.004318292109148981}, "ground_truth": 0}, {"key": "39855613", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9974019200667807, "res": {"Yes": 0.9974019200667807, "No": 0.00259697674734916}, "ground_truth": 0}, {"key": "29856302", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9917788797715805, "res": {"Yes": 0.9917788797715805, "No": 0.008220685329261}, "ground_truth": 0}, {"key": "29856302", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6441945514342237, "res": {"Yes": 0.6441945514342237, "No": 0.3558028121655064}, "ground_truth": 0}, {"key": "29856302", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9879542944326762, "res": {"Yes": 0.9879542944326762, "No": 0.012044134512510893}, "ground_truth": 1}, {"key": "29856302", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9919976248545296, "res": {"Yes": 0.9919976248545296, "No": 0.008000189900672266}, "ground_truth": 0}, {"key": "29856302", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9930270354255324, "res": {"Yes": 0.9930270354255324, "No": 0.0069699864378548375}, "ground_truth": 0}, {"key": "35641106", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7260078293404458, "res": {"Yes": 0.7260078293404458, "No": 0.2739902656636932}, "ground_truth": 0}, {"key": "35641106", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9958706616608699, "res": {"Yes": 0.9958706616608699, "No": 0.004128393214040948}, "ground_truth": 0}, {"key": "35641106", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998391812521558, "res": {"Yes": 0.998391812521558, "No": 0.0016077525610662796}, "ground_truth": 1}, {"key": "35641106", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993490140833357, "res": {"Yes": 0.9993490140833357, "No": 0.0006505903997684511}, "ground_truth": 0}, {"key": "35641106", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9974856504852866, "res": {"Yes": 0.9974856504852866, "No": 0.0025135067231983293}, "ground_truth": 0}, {"key": "39474558", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9993572301650938, "res": {"Yes": 0.9993572301650938, "No": 0.0006427318180283648}, "ground_truth": 0}, {"key": "39474558", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989793810861355, "res": {"Yes": 0.9989793810861355, "No": 0.0010205169156567138}, "ground_truth": 0}, {"key": "39474558", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9983162446092869, "res": {"Yes": 0.9983162446092869, "No": 0.0016836323609008507}, "ground_truth": 1}, {"key": "39474558", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9976320340651452, "res": {"Yes": 0.9976320340651452, "No": 0.0023679456833451363}, "ground_truth": 0}, {"key": "39474558", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8644430951738586, "res": {"Yes": 0.8644430951738586, "No": 0.13555566652016612}, "ground_truth": 0}, {"key": "34338135", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9977543751965166, "res": {"Yes": 0.9977543751965166, "No": 0.00224494782184025}, "ground_truth": 0}, {"key": "34338135", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998157875691939, "res": {"Yes": 0.9998157875691939, "No": 0.0001837236190452922}, "ground_truth": 0}, {"key": "34338135", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996491065775022, "res": {"Yes": 0.9996491065775022, "No": 0.00035062695708457613}, "ground_truth": 1}, {"key": "34338135", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996841297975001, "res": {"Yes": 0.9996841297975001, "No": 0.0003148462920426795}, "ground_truth": 0}, {"key": "34338135", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9957155740527877, "res": {"Yes": 0.9957155740527877, "No": 0.0042830221874918225}, "ground_truth": 0}, {"key": "35870330", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9874100608252472, "res": {"Yes": 0.9874100608252472, "No": 0.01258860423573182}, "ground_truth": 0}, {"key": "35870330", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9826608457016826, "res": {"Yes": 0.9826608457016826, "No": 0.017338037355380007}, "ground_truth": 0}, {"key": "35870330", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8511816401500253, "res": {"Yes": 0.8511816401500253, "No": 0.1488142046175234}, "ground_truth": 1}, {"key": "35870330", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.935651248212518, "res": {"Yes": 0.935651248212518, "No": 0.06434650878159807}, "ground_truth": 0}, {"key": "35870330", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8611961878996865, "res": {"Yes": 0.8611961878996865, "No": 0.1387943830038874}, "ground_truth": 0}, {"key": "24478245", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9983755336760918, "res": {"Yes": 0.9983755336760918, "No": 0.0016242773009541923}, "ground_truth": 0}, {"key": "24478245", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9625007948522686, "res": {"Yes": 0.9625007948522686, "No": 0.03749844550743663}, "ground_truth": 0}, {"key": "24478245", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9723477315404779, "res": {"Yes": 0.9723477315404779, "No": 0.027651016184204166}, "ground_truth": 1}, {"key": "24478245", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.99753962549511, "res": {"Yes": 0.99753962549511, "No": 0.0024602342745878437}, "ground_truth": 0}, {"key": "24478245", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9925567994433516, "res": {"Yes": 0.9925567994433516, "No": 0.0074425257888604745}, "ground_truth": 0}, {"key": "38485946", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 2.8851978168359078e-05, "res": {"No": 0.9999629731405111, "Yes": 2.8851978168359078e-05}, "ground_truth": 0}, {"key": "38485946", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6149597502901682, "res": {"Yes": 0.6149597502901682, "No": 0.3850155330206612}, "ground_truth": 0}, {"key": "38485946", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.01677484225072839, "res": {"No": 0.9832207031952128, "Yes": 0.01677484225072839}, "ground_truth": 1}, {"key": "38485946", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6237557210090962, "res": {"Yes": 0.6237557210090962, "No": 0.3762315126275046}, "ground_truth": 0}, {"key": "38485946", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.08126279445126505, "res": {"No": 0.9187269566195975, "Yes": 0.08126279445126505}, "ground_truth": 0}, {"key": "32509613", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8966282139899376, "res": {"Yes": 0.8966282139899376, "No": 0.1033714362742863}, "ground_truth": 0}, {"key": "32509613", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9953343262297011, "res": {"Yes": 0.9953343262297011, "No": 0.004665032397057893}, "ground_truth": 0}, {"key": "32509613", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9973026743376499, "res": {"Yes": 0.9973026743376499, "No": 0.0026970313793043417}, "ground_truth": 1}, {"key": "32509613", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9962124598929707, "res": {"Yes": 0.9962124598929707, "No": 0.003787197421692367}, "ground_truth": 0}, {"key": "32509613", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9913292804043033, "res": {"Yes": 0.9913292804043033, "No": 0.008670233990762066}, "ground_truth": 0}, {"key": "34078819", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.754969868349785, "res": {"Yes": 0.754969868349785, "No": 0.24502993309556798}, "ground_truth": 0}, {"key": "34078819", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9982019679997842, "res": {"Yes": 0.9982019679997842, "No": 0.0017977632961752173}, "ground_truth": 0}, {"key": "34078819", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.811548806722962, "res": {"Yes": 0.811548806722962, "No": 0.1884446404204572}, "ground_truth": 1}, {"key": "34078819", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9605639904239616, "res": {"Yes": 0.9605639904239616, "No": 0.03943558885302903}, "ground_truth": 0}, {"key": "34078819", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996385012564222, "res": {"Yes": 0.9996385012564222, "No": 0.0003613918974327721}, "ground_truth": 0}, {"key": "39523865", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9984273355348343, "res": {"Yes": 0.9984273355348343, "No": 0.0015723147222811776}, "ground_truth": 0}, {"key": "39523865", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994767712319385, "res": {"Yes": 0.9994767712319385, "No": 0.0005228029152529155}, "ground_truth": 0}, {"key": "39523865", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995695426233722, "res": {"Yes": 0.9995695426233722, "No": 0.00043021232159085455}, "ground_truth": 1}, {"key": "39523865", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996006308890822, "res": {"Yes": 0.9996006308890822, "No": 0.00039922395811886304}, "ground_truth": 0}, {"key": "39523865", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999058783297223, "res": {"Yes": 0.9999058783297223, "No": 9.384303611272636e-05}, "ground_truth": 0}, {"key": "33146158", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.06145107187986058, "res": {"No": 0.9385484963217692, "Yes": 0.06145107187986058}, "ground_truth": 0}, {"key": "33146158", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9544886470692086, "res": {"Yes": 0.9544886470692086, "No": 0.045510873661743514}, "ground_truth": 0}, {"key": "33146158", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9360112250515622, "res": {"Yes": 0.9360112250515622, "No": 0.06398812242213708}, "ground_truth": 1}, {"key": "33146158", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9755871325456037, "res": {"Yes": 0.9755871325456037, "No": 0.024412445872160637}, "ground_truth": 0}, {"key": "33146158", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9939623522925803, "res": {"Yes": 0.9939623522925803, "No": 0.006035722580205386}, "ground_truth": 0}, {"key": "32083974", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6705810926660238, "res": {"Yes": 0.6705810926660238, "No": 0.3294173141270159}, "ground_truth": 0}, {"key": "32083974", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9985213499817778, "res": {"Yes": 0.9985213499817778, "No": 0.0014782071657596266}, "ground_truth": 0}, {"key": "32083974", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9841294014867682, "res": {"Yes": 0.9841294014867682, "No": 0.015867637838138233}, "ground_truth": 1}, {"key": "32083974", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9970560020860143, "res": {"Yes": 0.9970560020860143, "No": 0.002943783265150366}, "ground_truth": 0}, {"key": "32083974", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9842726952539514, "res": {"Yes": 0.9842726952539514, "No": 0.01572543207225719}, "ground_truth": 0}, {"key": "34378482", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9974679741986955, "res": {"Yes": 0.9974679741986955, "No": 0.0025312341217955336}, "ground_truth": 0}, {"key": "34378482", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9571124708839487, "res": {"Yes": 0.9571124708839487, "No": 0.042884123634241766}, "ground_truth": 0}, {"key": "34378482", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.19626760879516444, "res": {"No": 0.8037253440852914, "Yes": 0.19626760879516444}, "ground_truth": 1}, {"key": "34378482", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9882090633875183, "res": {"Yes": 0.9882090633875183, "No": 0.01178896917972922}, "ground_truth": 0}, {"key": "34378482", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9524295166376227, "res": {"Yes": 0.9524295166376227, "No": 0.047569047112894024}, "ground_truth": 0}, {"key": "38080102", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9940844988849864, "res": {"Yes": 0.9940844988849864, "No": 0.005915191539979981}, "ground_truth": 0}, {"key": "38080102", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9884445075348713, "res": {"Yes": 0.9884445075348713, "No": 0.011555277730718334}, "ground_truth": 0}, {"key": "38080102", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980444969922774, "res": {"Yes": 0.9980444969922774, "No": 0.001953305916658866}, "ground_truth": 1}, {"key": "38080102", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988148800100264, "res": {"Yes": 0.9988148800100264, "No": 0.0011849939617235097}, "ground_truth": 0}, {"key": "38080102", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.736513244657106, "res": {"Yes": 0.736513244657106, "No": 0.2634738123000959}, "ground_truth": 0}, {"key": "40244537", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0533250274423704, "res": {"No": 0.9466736971080344, "Yes": 0.0533250274423704}, "ground_truth": 0}, {"key": "40244537", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.22151153812407862, "res": {"No": 0.7784842648897653, "Yes": 0.22151153812407862}, "ground_truth": 0}, {"key": "40244537", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9629845345213898, "res": {"Yes": 0.9629845345213898, "No": 0.03701307686482861}, "ground_truth": 1}, {"key": "40244537", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8044650472855416, "res": {"Yes": 0.8044650472855416, "No": 0.19553386344582036}, "ground_truth": 0}, {"key": "40244537", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.47624359569082, "res": {"No": 0.5237460759465573, "Yes": 0.47624359569082}, "ground_truth": 0}, {"key": "33497789", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.32555873113995704, "res": {"No": 0.6744350780036408, "Yes": 0.32555873113995704}, "ground_truth": 0}, {"key": "33497789", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.28279011488737693, "res": {"No": 0.7170899162778246, "Yes": 0.28279011488737693}, "ground_truth": 0}, {"key": "33497789", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.05000865442660412, "res": {"No": 0.9499904405662696, "Yes": 0.05000865442660412}, "ground_truth": 1}, {"key": "33497789", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.24323848431066303, "res": {"No": 0.7567530353911114, "Yes": 0.24323848431066303}, "ground_truth": 0}, {"key": "33497789", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.975283491240687, "res": {"Yes": 0.975283491240687, "No": 0.02471552228841528}, "ground_truth": 0}, {"key": "28816889", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9991784383367386, "res": {"Yes": 0.9991784383367386, "No": 0.0008214208280453691}, "ground_truth": 0}, {"key": "28816889", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9979810893472987, "res": {"Yes": 0.9979810893472987, "No": 0.00201867545094426}, "ground_truth": 0}, {"key": "28816889", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998683407378415, "res": {"Yes": 0.9998683407378415, "No": 0.00013156085996361876}, "ground_truth": 1}, {"key": "28816889", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999720323251027, "res": {"Yes": 0.9999720323251027, "No": 2.786921174917785e-05}, "ground_truth": 0}, {"key": "28816889", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999987886094374, "res": {"Yes": 0.999987886094374, "No": 1.2014912155962867e-05}, "ground_truth": 0}, {"key": "38157127", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0002076019528344041, "res": {"No": 0.9997914747944036, "Yes": 0.0002076019528344041}, "ground_truth": 0}, {"key": "38157127", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.00589577079212008, "res": {"No": 0.9941026460631514, "Yes": 0.00589577079212008}, "ground_truth": 0}, {"key": "38157127", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9916174521361811, "res": {"Yes": 0.9916174521361811, "No": 0.008381167955794553}, "ground_truth": 1}, {"key": "38157127", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9952724379668312, "res": {"Yes": 0.9952724379668312, "No": 0.004726504292131093}, "ground_truth": 0}, {"key": "38157127", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8790097053536077, "res": {"Yes": 0.8790097053536077, "No": 0.12098843699216047}, "ground_truth": 0}, {"key": "36183569", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.998057071234496, "res": {"Yes": 0.998057071234496, "No": 0.0019419629258513446}, "ground_truth": 0}, {"key": "36183569", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9918368152351681, "res": {"Yes": 0.9918368152351681, "No": 0.008162261530981913}, "ground_truth": 0}, {"key": "36183569", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9544040544891944, "res": {"Yes": 0.9544040544891944, "No": 0.04559459956807116}, "ground_truth": 1}, {"key": "36183569", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9981217962363528, "res": {"Yes": 0.9981217962363528, "No": 0.0018774316120425821}, "ground_truth": 0}, {"key": "36183569", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9896760931742197, "res": {"Yes": 0.9896760931742197, "No": 0.010323432165942843}, "ground_truth": 0}, {"key": "36012016", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9981682377280655, "res": {"Yes": 0.9981682377280655, "No": 0.0018311604269612219}, "ground_truth": 0}, {"key": "36012016", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999648749133035, "res": {"Yes": 0.999648749133035, "No": 0.0003505974004779223}, "ground_truth": 0}, {"key": "36012016", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993949648076534, "res": {"Yes": 0.9993949648076534, "No": 0.0006044334409057962}, "ground_truth": 1}, {"key": "36012016", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9982665866992374, "res": {"Yes": 0.9982665866992374, "No": 0.0017322393249674056}, "ground_truth": 0}, {"key": "36012016", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9975416433203053, "res": {"Yes": 0.9975416433203053, "No": 0.0024578753035096146}, "ground_truth": 0}, {"key": "34571973", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.08235878081932897, "res": {"No": 0.9176372306932957, "Yes": 0.08235878081932897}, "ground_truth": 0}, {"key": "34571973", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9095006648665347, "res": {"Yes": 0.9095006648665347, "No": 0.09049526953263716}, "ground_truth": 0}, {"key": "34571973", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5487789443585973, "res": {"Yes": 0.5487789443585973, "No": 0.451204931100733}, "ground_truth": 1}, {"key": "34571973", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9935383059160815, "res": {"Yes": 0.9935383059160815, "No": 0.006460313066857799}, "ground_truth": 0}, {"key": "34571973", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9815024736438244, "res": {"Yes": 0.9815024736438244, "No": 0.018490268727904366}, "ground_truth": 0}, {"key": "38707498", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9960987839927583, "res": {"Yes": 0.9960987839927583, "No": 0.003900835180215136}, "ground_truth": 0}, {"key": "38707498", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.009872662550110427, "res": {"No": 0.9901259442803788, "Yes": 0.009872662550110427}, "ground_truth": 0}, {"key": "38707498", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9160522723975641, "res": {"Yes": 0.9160522723975641, "No": 0.0839414791262094}, "ground_truth": 1}, {"key": "38707498", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.02266321847838658, "res": {"No": 0.9773326771946675, "Yes": 0.02266321847838658}, "ground_truth": 0}, {"key": "38707498", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.06935218679402395, "res": {"No": 0.9306445298766799, "Yes": 0.06935218679402395}, "ground_truth": 0}, {"key": "35459082", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9950098906710847, "res": {"Yes": 0.9950098906710847, "No": 0.0049898770939150044}, "ground_truth": 0}, {"key": "35459082", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9677613387328935, "res": {"Yes": 0.9677613387328935, "No": 0.03223761630584586}, "ground_truth": 0}, {"key": "35459082", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9659651664455088, "res": {"Yes": 0.9659651664455088, "No": 0.034033736374776476}, "ground_truth": 1}, {"key": "35459082", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9673697349709435, "res": {"Yes": 0.9673697349709435, "No": 0.03262868074280853}, "ground_truth": 0}, {"key": "35459082", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9883969971145785, "res": {"Yes": 0.9883969971145785, "No": 0.01160278063130864}, "ground_truth": 0}, {"key": "39464041", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7126473366046608, "res": {"Yes": 0.7126473366046608, "No": 0.28733646441786276}, "ground_truth": 0}, {"key": "39464041", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.2869106602529582, "res": {"No": 0.7130667959474962, "Yes": 0.2869106602529582}, "ground_truth": 0}, {"key": "39464041", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9176527847761765, "res": {"Yes": 0.9176527847761765, "No": 0.0823441716674817}, "ground_truth": 1}, {"key": "39464041", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9648037270384905, "res": {"Yes": 0.9648037270384905, "No": 0.03519422402645067}, "ground_truth": 0}, {"key": "39464041", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8213625922092096, "res": {"Yes": 0.8213625922092096, "No": 0.17863442141897584}, "ground_truth": 0}, {"key": "23782052", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9768883557371714, "res": {"Yes": 0.9768883557371714, "No": 0.023103404300421564}, "ground_truth": 0}, {"key": "23782052", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9975097298800268, "res": {"Yes": 0.9975097298800268, "No": 0.0024891698939781834}, "ground_truth": 0}, {"key": "23782052", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.924114484538368, "res": {"Yes": 0.924114484538368, "No": 0.07588428991475644}, "ground_truth": 1}, {"key": "23782052", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9914993020063426, "res": {"Yes": 0.9914993020063426, "No": 0.008500201584020184}, "ground_truth": 0}, {"key": "23782052", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.965004287160164, "res": {"Yes": 0.965004287160164, "No": 0.03498800466825772}, "ground_truth": 0}, {"key": "36568455", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.955180192551368, "res": {"Yes": 0.955180192551368, "No": 0.04481878138807807}, "ground_truth": 0}, {"key": "36568455", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992754409197937, "res": {"Yes": 0.9992754409197937, "No": 0.0007241094521513664}, "ground_truth": 0}, {"key": "36568455", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999737011318213, "res": {"Yes": 0.9999737011318213, "No": 2.621229454031631e-05}, "ground_truth": 1}, {"key": "36568455", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997491818801253, "res": {"Yes": 0.9997491818801253, "No": 0.0002503746905312559}, "ground_truth": 0}, {"key": "36568455", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.995516465186398, "res": {"Yes": 0.995516465186398, "No": 0.00448180236430799}, "ground_truth": 0}, {"key": "38469552", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0003357289231364141, "res": {"No": 0.9996642365811576, "Yes": 0.0003357289231364141}, "ground_truth": 0}, {"key": "38469552", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994717709621076, "res": {"Yes": 0.9994717709621076, "No": 0.0005276470308411659}, "ground_truth": 0}, {"key": "38469552", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994834394633573, "res": {"Yes": 0.9994834394633573, "No": 0.0005162210978760316}, "ground_truth": 1}, {"key": "38469552", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.989911884866551, "res": {"Yes": 0.989911884866551, "No": 0.010086228504222618}, "ground_truth": 0}, {"key": "38469552", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8373485897376991, "res": {"Yes": 0.8373485897376991, "No": 0.16264912593145922}, "ground_truth": 0}, {"key": "35922277", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9594460071289372, "res": {"Yes": 0.9594460071289372, "No": 0.04055363337873006}, "ground_truth": 0}, {"key": "35922277", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.993948455503892, "res": {"Yes": 0.993948455503892, "No": 0.006051198060591533}, "ground_truth": 0}, {"key": "35922277", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9984021484262983, "res": {"Yes": 0.9984021484262983, "No": 0.0015976927846924492}, "ground_truth": 1}, {"key": "35922277", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997009286607517, "res": {"Yes": 0.9997009286607517, "No": 0.000298894765910601}, "ground_truth": 0}, {"key": "35922277", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998864501472726, "res": {"Yes": 0.9998864501472726, "No": 0.00011337745454191715}, "ground_truth": 0}, {"key": "32744293", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8226063695693104, "res": {"Yes": 0.8226063695693104, "No": 0.177392178447952}, "ground_truth": 0}, {"key": "32744293", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6572496683334269, "res": {"Yes": 0.6572496683334269, "No": 0.342747587233479}, "ground_truth": 0}, {"key": "32744293", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9505853397718447, "res": {"Yes": 0.9505853397718447, "No": 0.04941305097020231}, "ground_truth": 1}, {"key": "32744293", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9735888711426722, "res": {"Yes": 0.9735888711426722, "No": 0.026410405467208964}, "ground_truth": 0}, {"key": "32744293", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.026837792953770517, "res": {"No": 0.9731515563537656, "Yes": 0.026837792953770517}, "ground_truth": 0}, {"key": "30972362", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.18851680968919893, "res": {"No": 0.8114818404784965, "Yes": 0.18851680968919893}, "ground_truth": 0}, {"key": "30972362", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7100989872519049, "res": {"Yes": 0.7100989872519049, "No": 0.28989833106631147}, "ground_truth": 0}, {"key": "30972362", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8464779636985059, "res": {"Yes": 0.8464779636985059, "No": 0.153517778164517}, "ground_truth": 1}, {"key": "30972362", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7982463419377506, "res": {"Yes": 0.7982463419377506, "No": 0.20175130569634703}, "ground_truth": 0}, {"key": "30972362", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9417907903454626, "res": {"Yes": 0.9417907903454626, "No": 0.058208243114742826}, "ground_truth": 0}, {"key": "36380943", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.833094481564938, "res": {"Yes": 0.833094481564938, "No": 0.166904197306442}, "ground_truth": 0}, {"key": "36380943", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9985194455038231, "res": {"Yes": 0.9985194455038231, "No": 0.0014798744883073704}, "ground_truth": 0}, {"key": "36380943", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9984033385223685, "res": {"Yes": 0.9984033385223685, "No": 0.001591599808071356}, "ground_truth": 1}, {"key": "36380943", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991232260510948, "res": {"Yes": 0.9991232260510948, "No": 0.0008758317076841944}, "ground_truth": 0}, {"key": "36380943", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.07918438172897822, "res": {"No": 0.9207761254152831, "Yes": 0.07918438172897822}, "ground_truth": 0}, {"key": "36929355", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7061015947002909, "res": {"Yes": 0.7061015947002909, "No": 0.2938970332582541}, "ground_truth": 0}, {"key": "36929355", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9931433081214067, "res": {"Yes": 0.9931433081214067, "No": 0.006856110366628051}, "ground_truth": 0}, {"key": "36929355", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9204486727944978, "res": {"Yes": 0.9204486727944978, "No": 0.07955034399072176}, "ground_truth": 1}, {"key": "36929355", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9340023076864279, "res": {"Yes": 0.9340023076864279, "No": 0.065995085622049}, "ground_truth": 0}, {"key": "36929355", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.07728541667376077, "res": {"No": 0.9227127374056062, "Yes": 0.07728541667376077}, "ground_truth": 0}, {"key": "39127206", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7895802214490373, "res": {"Yes": 0.7895802214490373, "No": 0.21039764313735038}, "ground_truth": 0}, {"key": "39127206", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6868440458680299, "res": {"Yes": 0.6868440458680299, "No": 0.3131206498293725}, "ground_truth": 0}, {"key": "39127206", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3083945528692554, "res": {"No": 0.6915953145455195, "Yes": 0.3083945528692554}, "ground_truth": 1}, {"key": "39127206", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.2868487229277844, "res": {"No": 0.7131087255078149, "Yes": 0.2868487229277844}, "ground_truth": 0}, {"key": "39127206", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.2501096143035418, "res": {"No": 0.7498692432383811, "Yes": 0.2501096143035418}, "ground_truth": 0}, {"key": "36128318", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.960963756579847, "res": {"Yes": 0.960963756579847, "No": 0.03903389139870731}, "ground_truth": 0}, {"key": "36128318", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9270325599786988, "res": {"Yes": 0.9270325599786988, "No": 0.07296342432780055}, "ground_truth": 0}, {"key": "36128318", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9437202198902062, "res": {"Yes": 0.9437202198902062, "No": 0.05627603502997339}, "ground_truth": 1}, {"key": "36128318", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9906276884771726, "res": {"Yes": 0.9906276884771726, "No": 0.00937087316287824}, "ground_truth": 0}, {"key": "36128318", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9816892369786718, "res": {"Yes": 0.9816892369786718, "No": 0.018308899973659552}, "ground_truth": 0}, {"key": "39863480", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8537020958069412, "res": {"Yes": 0.8537020958069412, "No": 0.14629487534062782}, "ground_truth": 0}, {"key": "39863480", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9008644920188331, "res": {"Yes": 0.9008644920188331, "No": 0.09912793404698601}, "ground_truth": 0}, {"key": "39863480", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9924037980853089, "res": {"Yes": 0.9924037980853089, "No": 0.00759448844031555}, "ground_truth": 1}, {"key": "39863480", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9950699686944209, "res": {"Yes": 0.9950699686944209, "No": 0.0049279214125831534}, "ground_truth": 0}, {"key": "39863480", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8544118000086744, "res": {"Yes": 0.8544118000086744, "No": 0.1455788812645116}, "ground_truth": 0}, {"key": "38634057", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.00809901119051982, "res": {"No": 0.9919001450457351, "Yes": 0.00809901119051982}, "ground_truth": 0}, {"key": "38634057", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.37944109939590964, "res": {"No": 0.6205561418660641, "Yes": 0.37944109939590964}, "ground_truth": 0}, {"key": "38634057", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6153968098326368, "res": {"Yes": 0.6153968098326368, "No": 0.38459899074456444}, "ground_truth": 1}, {"key": "38634057", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.23813508078309042, "res": {"No": 0.7618607673530089, "Yes": 0.23813508078309042}, "ground_truth": 0}, {"key": "38634057", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.03086984072566018, "res": {"No": 0.9691281229551176, "Yes": 0.03086984072566018}, "ground_truth": 0}, {"key": "33131935", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7095657824844355, "res": {"Yes": 0.7095657824844355, "No": 0.29042642644987926}, "ground_truth": 0}, {"key": "33131935", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9885233618637523, "res": {"Yes": 0.9885233618637523, "No": 0.011474019193751453}, "ground_truth": 0}, {"key": "33131935", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4381384380226359, "res": {"No": 0.5618602643225259, "Yes": 0.4381384380226359}, "ground_truth": 1}, {"key": "33131935", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.10963117516268475, "res": {"No": 0.8903644194550435, "Yes": 0.10963117516268475}, "ground_truth": 0}, {"key": "33131935", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9197506944089858, "res": {"Yes": 0.9197506944089858, "No": 0.08024192861793276}, "ground_truth": 0}, {"key": "39021319", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.972530125102656, "res": {"Yes": 0.972530125102656, "No": 0.02746947200076939}, "ground_truth": 0}, {"key": "39021319", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999361630584512, "res": {"Yes": 0.999361630584512, "No": 0.0006380248024893213}, "ground_truth": 0}, {"key": "39021319", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993567536716801, "res": {"Yes": 0.9993567536716801, "No": 0.0006430333299500395}, "ground_truth": 1}, {"key": "39021319", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994131811055954, "res": {"Yes": 0.9994131811055954, "No": 0.0005866772611411033}, "ground_truth": 0}, {"key": "39021319", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9955059476105025, "res": {"Yes": 0.9955059476105025, "No": 0.0044937555565024686}, "ground_truth": 0}, {"key": "40644571", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9962699557625339, "res": {"Yes": 0.9962699557625339, "No": 0.0037297651864589033}, "ground_truth": 0}, {"key": "40644571", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992818696191378, "res": {"Yes": 0.9992818696191378, "No": 0.0007179145551262681}, "ground_truth": 0}, {"key": "40644571", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995874083093709, "res": {"Yes": 0.9995874083093709, "No": 0.00041236156851159715}, "ground_truth": 1}, {"key": "40644571", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998762071829632, "res": {"Yes": 0.9998762071829632, "No": 0.00012361260944262077}, "ground_truth": 0}, {"key": "40644571", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998253184785939, "res": {"Yes": 0.9998253184785939, "No": 0.0001744499808683296}, "ground_truth": 0}, {"key": "14681877", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9990263609443913, "res": {"Yes": 0.9990263609443913, "No": 0.0009736104334367795}, "ground_truth": 0}, {"key": "14681877", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999152945777069, "res": {"Yes": 0.9999152945777069, "No": 8.45658531415421e-05}, "ground_truth": 0}, {"key": "14681877", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993941309128427, "res": {"Yes": 0.9993941309128427, "No": 0.0006056860956966888}, "ground_truth": 1}, {"key": "14681877", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997787264246095, "res": {"Yes": 0.9997787264246095, "No": 0.00022111911936591782}, "ground_truth": 0}, {"key": "14681877", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9986499628212162, "res": {"Yes": 0.9986499628212162, "No": 0.0013499887768645804}, "ground_truth": 0}, {"key": "36570890", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9989582067437867, "res": {"Yes": 0.9989582067437867, "No": 0.0010413014020368618}, "ground_truth": 0}, {"key": "36570890", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.36709452602158155, "res": {"No": 0.6328589370085906, "Yes": 0.36709452602158155}, "ground_truth": 0}, {"key": "36570890", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9894053914418199, "res": {"Yes": 0.9894053914418199, "No": 0.010575030181619652}, "ground_truth": 1}, {"key": "36570890", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9497557601699208, "res": {"Yes": 0.9497557601699208, "No": 0.05023297476997371}, "ground_truth": 0}, {"key": "36570890", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6131238219810828, "res": {"Yes": 0.6131238219810828, "No": 0.3868502158572049}, "ground_truth": 0}, {"key": "30452755", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9661336019854669, "res": {"Yes": 0.9661336019854669, "No": 0.03386559421117972}, "ground_truth": 0}, {"key": "30452755", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9744289323401537, "res": {"Yes": 0.9744289323401537, "No": 0.025568473252674834}, "ground_truth": 0}, {"key": "30452755", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9881102395171782, "res": {"Yes": 0.9881102395171782, "No": 0.011887498230077731}, "ground_truth": 1}, {"key": "30452755", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9388541703277452, "res": {"Yes": 0.9388541703277452, "No": 0.06114343387286567}, "ground_truth": 0}, {"key": "30452755", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9543517164059696, "res": {"Yes": 0.9543517164059696, "No": 0.04564761128661285}, "ground_truth": 0}, {"key": "37347053", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8839645225604568, "res": {"Yes": 0.8839645225604568, "No": 0.11603496626252871}, "ground_truth": 0}, {"key": "37347053", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995516736283152, "res": {"Yes": 0.9995516736283152, "No": 0.0004481551807160536}, "ground_truth": 0}, {"key": "37347053", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995422680912289, "res": {"Yes": 0.9995422680912289, "No": 0.00045613647771250253}, "ground_truth": 1}, {"key": "37347053", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9822737614488196, "res": {"Yes": 0.9822737614488196, "No": 0.01772516318709713}, "ground_truth": 0}, {"key": "37347053", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990725313651551, "res": {"Yes": 0.9990725313651551, "No": 0.0009261174458398341}, "ground_truth": 0}, {"key": "38890979", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.00044741705025042993, "res": {"No": 0.9995515544817628, "Yes": 0.00044741705025042993}, "ground_truth": 0}, {"key": "38890979", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996986644806704, "res": {"Yes": 0.9996986644806704, "No": 0.00030093282225537795}, "ground_truth": 0}, {"key": "38890979", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9962071379409829, "res": {"Yes": 0.9962071379409829, "No": 0.0037925563066854512}, "ground_truth": 1}, {"key": "38890979", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999236765171988, "res": {"Yes": 0.999236765171988, "No": 0.0007628127268429224}, "ground_truth": 0}, {"key": "38890979", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9989996068272273, "res": {"Yes": 0.9989996068272273, "No": 0.0010000312794713295}, "ground_truth": 0}, {"key": "32974694", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9916795749489402, "res": {"Yes": 0.9916795749489402, "No": 0.008319611665982827}, "ground_truth": 0}, {"key": "32974694", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9926251554120943, "res": {"Yes": 0.9926251554120943, "No": 0.007373041288728505}, "ground_truth": 0}, {"key": "32974694", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999776104528333, "res": {"Yes": 0.999776104528333, "No": 0.00022336418544606387}, "ground_truth": 1}, {"key": "32974694", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9948862163398127, "res": {"Yes": 0.9948862163398127, "No": 0.005112153678778015}, "ground_truth": 0}, {"key": "32974694", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993234169855787, "res": {"Yes": 0.9993234169855787, "No": 0.0006760642108281913}, "ground_truth": 0}, {"key": "38519940", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0014692752896414197, "res": {"No": 0.9985302587291516, "Yes": 0.0014692752896414197}, "ground_truth": 0}, {"key": "38519940", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9945626621253714, "res": {"Yes": 0.9945626621253714, "No": 0.005434033516895713}, "ground_truth": 0}, {"key": "38519940", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9946804710713109, "res": {"Yes": 0.9946804710713109, "No": 0.005318308379346621}, "ground_truth": 1}, {"key": "38519940", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9949465136440612, "res": {"Yes": 0.9949465136440612, "No": 0.00505230350545952}, "ground_truth": 0}, {"key": "38519940", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9977057150042696, "res": {"Yes": 0.9977057150042696, "No": 0.0022940533596913313}, "ground_truth": 0}, {"key": "38870104", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.09092694473461552, "res": {"No": 0.9090722091053545, "Yes": 0.09092694473461552}, "ground_truth": 0}, {"key": "38870104", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.010530031093411647, "res": {"No": 0.9894661991974737, "Yes": 0.010530031093411647}, "ground_truth": 1}, {"key": "38870104", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.06010166704332226, "res": {"No": 0.9398936767085633, "Yes": 0.06010166704332226}, "ground_truth": 0}, {"key": "38870104", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.018698667768231758, "res": {"No": 0.9813003972005764, "Yes": 0.018698667768231758}, "ground_truth": 0}, {"key": "34283161", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9398036420266107, "res": {"Yes": 0.9398036420266107, "No": 0.06019480656940569}, "ground_truth": 0}, {"key": "34283161", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.987683967850935, "res": {"Yes": 0.987683967850935, "No": 0.012314628676447873}, "ground_truth": 0}, {"key": "34283161", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.997871158903295, "res": {"Yes": 0.997871158903295, "No": 0.002128222829231572}, "ground_truth": 1}, {"key": "34283161", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9974220811545131, "res": {"Yes": 0.9974220811545131, "No": 0.0025758762795974406}, "ground_truth": 0}, {"key": "34283161", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9296636917592503, "res": {"Yes": 0.9296636917592503, "No": 0.07033545280218473}, "ground_truth": 0}, {"key": "31650463", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9882934778345001, "res": {"Yes": 0.9882934778345001, "No": 0.011705950227517858}, "ground_truth": 0}, {"key": "31650463", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9836533948376219, "res": {"Yes": 0.9836533948376219, "No": 0.016346188959024677}, "ground_truth": 0}, {"key": "31650463", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9976210038075387, "res": {"Yes": 0.9976210038075387, "No": 0.0023775232129409126}, "ground_truth": 1}, {"key": "31650463", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9903264239875945, "res": {"Yes": 0.9903264239875945, "No": 0.009671924226653628}, "ground_truth": 0}, {"key": "31650463", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9958320116746473, "res": {"Yes": 0.9958320116746473, "No": 0.004167537271533303}, "ground_truth": 0}, {"key": "35589432", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6991868933676999, "res": {"Yes": 0.6991868933676999, "No": 0.3008117575712429}, "ground_truth": 0}, {"key": "35589432", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7852662238749917, "res": {"Yes": 0.7852662238749917, "No": 0.21472816492592614}, "ground_truth": 0}, {"key": "35589432", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.06286791756552407, "res": {"No": 0.93712987414872, "Yes": 0.06286791756552407}, "ground_truth": 1}, {"key": "35589432", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.48918865322032723, "res": {"No": 0.5108068932024841, "Yes": 0.48918865322032723}, "ground_truth": 0}, {"key": "35589432", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.1416898308797673, "res": {"No": 0.8583049869588972, "Yes": 0.1416898308797673}, "ground_truth": 0}, {"key": "14412752", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9976129317893673, "res": {"Yes": 0.9976129317893673, "No": 0.002385825721726229}, "ground_truth": 0}, {"key": "14412752", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9904653270089055, "res": {"Yes": 0.9904653270089055, "No": 0.009530506640808456}, "ground_truth": 0}, {"key": "14412752", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9927876331563437, "res": {"Yes": 0.9927876331563437, "No": 0.007208123680798426}, "ground_truth": 1}, {"key": "14412752", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9982259565786179, "res": {"Yes": 0.9982259565786179, "No": 0.0017736718316553972}, "ground_truth": 0}, {"key": "14412752", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9971231929626972, "res": {"Yes": 0.9971231929626972, "No": 0.0028745886305400798}, "ground_truth": 0}, {"key": "37271183", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9949450972392125, "res": {"Yes": 0.9949450972392125, "No": 0.005054609903059309}, "ground_truth": 0}, {"key": "37271183", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9971114512082476, "res": {"Yes": 0.9971114512082476, "No": 0.0028884940576191357}, "ground_truth": 0}, {"key": "37271183", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9933827619862117, "res": {"Yes": 0.9933827619862117, "No": 0.006616088134048127}, "ground_truth": 1}, {"key": "37271183", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978960913250322, "res": {"Yes": 0.9978960913250322, "No": 0.0021036970123784818}, "ground_truth": 0}, {"key": "37271183", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9977072574584974, "res": {"Yes": 0.9977072574584974, "No": 0.00229258678155615}, "ground_truth": 0}, {"key": "35588153", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9982834552510589, "res": {"Yes": 0.9982834552510589, "No": 0.0017163241451154483}, "ground_truth": 0}, {"key": "35588153", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989030065377292, "res": {"Yes": 0.9989030065377292, "No": 0.001096225131059213}, "ground_truth": 0}, {"key": "35588153", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994105638857601, "res": {"Yes": 0.9994105638857601, "No": 0.0005887740878058039}, "ground_truth": 1}, {"key": "35588153", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978646314502455, "res": {"Yes": 0.9978646314502455, "No": 0.0021347699283611765}, "ground_truth": 0}, {"key": "35588153", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9952021817765869, "res": {"Yes": 0.9952021817765869, "No": 0.00479700890545749}, "ground_truth": 0}, {"key": "39876692", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9960003778800204, "res": {"Yes": 0.9960003778800204, "No": 0.003999072578979325}, "ground_truth": 0}, {"key": "39876692", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9986830096939099, "res": {"Yes": 0.9986830096939099, "No": 0.0013166587518611236}, "ground_truth": 0}, {"key": "39876692", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9989804527917904, "res": {"Yes": 0.9989804527917904, "No": 0.0010191289368683188}, "ground_truth": 1}, {"key": "39876692", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996543460520952, "res": {"Yes": 0.9996543460520952, "No": 0.0003455037710689681}, "ground_truth": 0}, {"key": "39876692", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9982580336875899, "res": {"Yes": 0.9982580336875899, "No": 0.001741679676615831}, "ground_truth": 0}, {"key": "38992323", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8933203346644121, "res": {"Yes": 0.8933203346644121, "No": 0.10667600807370682}, "ground_truth": 0}, {"key": "38992323", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9984774883985483, "res": {"Yes": 0.9984774883985483, "No": 0.0015198945827241035}, "ground_truth": 0}, {"key": "38992323", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.45067881727579584, "res": {"No": 0.549288211397916, "Yes": 0.45067881727579584}, "ground_truth": 1}, {"key": "38992323", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9966831937949912, "res": {"Yes": 0.9966831937949912, "No": 0.0033140674736531956}, "ground_truth": 0}, {"key": "38992323", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9709903839343941, "res": {"Yes": 0.9709903839343941, "No": 0.028993256804973007}, "ground_truth": 0}, {"key": "37556002", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5942079123923272, "res": {"Yes": 0.5942079123923272, "No": 0.40579158038274066}, "ground_truth": 0}, {"key": "37556002", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9945071223243295, "res": {"Yes": 0.9945071223243295, "No": 0.0054924569043965765}, "ground_truth": 0}, {"key": "37556002", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998845431116596, "res": {"Yes": 0.9998845431116596, "No": 0.00011518903459963412}, "ground_truth": 1}, {"key": "37556002", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988103628799458, "res": {"Yes": 0.9988103628799458, "No": 0.0011894997956692081}, "ground_truth": 0}, {"key": "37556002", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997543063676252, "res": {"Yes": 0.9997543063676252, "No": 0.00024551168871239307}, "ground_truth": 0}, {"key": "39875801", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 7.737106217244222e-08, "res": {"No": 0.9999998063873687, "Yes": 7.737106217244222e-08}, "ground_truth": 0}, {"key": "39875801", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999458907543352, "res": {"Yes": 0.999458907543352, "No": 0.0005399181521426864}, "ground_truth": 0}, {"key": "39875801", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995849060953229, "res": {"Yes": 0.9995849060953229, "No": 0.000414983001007595}, "ground_truth": 1}, {"key": "39875801", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996595892129042, "res": {"Yes": 0.9996595892129042, "No": 0.00033956685785510143}, "ground_truth": 0}, {"key": "39875801", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992749644254061, "res": {"Yes": 0.9992749644254061, "No": 0.0007249272159081688}, "ground_truth": 0}, {"key": "39272285", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.012748878143423972, "res": {"No": 0.9872496937702797, "Yes": 0.012748878143423972}, "ground_truth": 0}, {"key": "39272285", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9683921016826271, "res": {"Yes": 0.9683921016826271, "No": 0.031606938806809697}, "ground_truth": 0}, {"key": "39272285", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9932317340893211, "res": {"Yes": 0.9932317340893211, "No": 0.006767821710746536}, "ground_truth": 1}, {"key": "39272285", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9954993390657549, "res": {"Yes": 0.9954993390657549, "No": 0.004500174973328035}, "ground_truth": 0}, {"key": "39272285", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9729011061886634, "res": {"Yes": 0.9729011061886634, "No": 0.02709750017001972}, "ground_truth": 0}, {"key": "39629714", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9966557148208021, "res": {"Yes": 0.9966557148208021, "No": 0.0033439196906567435}, "ground_truth": 0}, {"key": "39629714", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9826331016470297, "res": {"Yes": 0.9826331016470297, "No": 0.01736660794817167}, "ground_truth": 0}, {"key": "39629714", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9510803557020229, "res": {"Yes": 0.9510803557020229, "No": 0.048918002547322176}, "ground_truth": 1}, {"key": "39629714", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9957388655064753, "res": {"Yes": 0.9957388655064753, "No": 0.004260537299546703}, "ground_truth": 0}, {"key": "39629714", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9627855899507337, "res": {"Yes": 0.9627855899507337, "No": 0.03721337646294648}, "ground_truth": 0}, {"key": "34043257", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.08825107517118999, "res": {"No": 0.9117451123888101, "Yes": 0.08825107517118999}, "ground_truth": 0}, {"key": "34043257", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8152323209351277, "res": {"Yes": 0.8152323209351277, "No": 0.18476535690188683}, "ground_truth": 0}, {"key": "34043257", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7861687067135825, "res": {"Yes": 0.7861687067135825, "No": 0.21383072107459208}, "ground_truth": 1}, {"key": "34043257", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.07553555548540893, "res": {"No": 0.9244616508296609, "Yes": 0.07553555548540893}, "ground_truth": 0}, {"key": "34043257", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9782471140607295, "res": {"Yes": 0.9782471140607295, "No": 0.021744193991556256}, "ground_truth": 0}, {"key": "33995240", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.09805824893458709, "res": {"No": 0.9019402435048891, "Yes": 0.09805824893458709}, "ground_truth": 0}, {"key": "33995240", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997023586839678, "res": {"Yes": 0.9997023586839678, "No": 0.00029731897665818854}, "ground_truth": 0}, {"key": "33995240", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998594016848696, "res": {"Yes": 0.9998594016848696, "No": 0.00014036280824559856}, "ground_truth": 1}, {"key": "33995240", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999637428784835, "res": {"Yes": 0.999637428784835, "No": 0.0003623784319693009}, "ground_truth": 0}, {"key": "33995240", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.994333952341323, "res": {"Yes": 0.994333952341323, "No": 0.005664243118771437}, "ground_truth": 0}, {"key": "39399948", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9946947448384849, "res": {"Yes": 0.9946947448384849, "No": 0.0053044043186364674}, "ground_truth": 0}, {"key": "39399948", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9985528341558492, "res": {"Yes": 0.9985528341558492, "No": 0.0014467610206750396}, "ground_truth": 0}, {"key": "39399948", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9989860459991053, "res": {"Yes": 0.9989860459991053, "No": 0.0010127867390653299}, "ground_truth": 1}, {"key": "39399948", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991673725267863, "res": {"Yes": 0.9991673725267863, "No": 0.0008300550782815128}, "ground_truth": 0}, {"key": "39399948", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9871739430330673, "res": {"Yes": 0.9871739430330673, "No": 0.012823401949712265}, "ground_truth": 0}, {"key": "33185890", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9440738924496328, "res": {"Yes": 0.9440738924496328, "No": 0.055925535294624205}, "ground_truth": 0}, {"key": "33185890", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9719971204753557, "res": {"Yes": 0.9719971204753557, "No": 0.028001673576607468}, "ground_truth": 0}, {"key": "33185890", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8583852765624636, "res": {"Yes": 0.8583852765624636, "No": 0.14161391964163184}, "ground_truth": 1}, {"key": "33185890", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9966546455094593, "res": {"Yes": 0.9966546455094593, "No": 0.0033451156901700904}, "ground_truth": 0}, {"key": "33185890", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9818204455677482, "res": {"Yes": 0.9818204455677482, "No": 0.01817896722776844}, "ground_truth": 0}, {"key": "35280425", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9957628515514547, "res": {"Yes": 0.9957628515514547, "No": 0.004236910207641371}, "ground_truth": 0}, {"key": "35280425", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9936989533808782, "res": {"Yes": 0.9936989533808782, "No": 0.006299628598131295}, "ground_truth": 0}, {"key": "35280425", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9964983723474145, "res": {"Yes": 0.9964983723474145, "No": 0.0035012928254159895}, "ground_truth": 1}, {"key": "35280425", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9971093153978067, "res": {"Yes": 0.9971093153978067, "No": 0.0028902276740866376}, "ground_truth": 0}, {"key": "35280425", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9943120261273591, "res": {"Yes": 0.9943120261273591, "No": 0.005686609945785989}, "ground_truth": 0}, {"key": "16365170", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996792476720305, "res": {"Yes": 0.9996792476720305, "No": 0.00032066519031004624}, "ground_truth": 0}, {"key": "16365170", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9988701869199327, "res": {"Yes": 0.9988701869199327, "No": 0.0011297352112997368}, "ground_truth": 0}, {"key": "16365170", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.993282425461005, "res": {"Yes": 0.993282425461005, "No": 0.006717212614533394}, "ground_truth": 1}, {"key": "16365170", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9980557626827278, "res": {"Yes": 0.9980557626827278, "No": 0.0019440582682761537}, "ground_truth": 0}, {"key": "16365170", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9981741650682937, "res": {"Yes": 0.9981741650682937, "No": 0.0018258000581212292}, "ground_truth": 0}, {"key": "24388238", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9993392494518504, "res": {"Yes": 0.9993392494518504, "No": 0.0006606101369897865}, "ground_truth": 0}, {"key": "24388238", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992980624335197, "res": {"Yes": 0.9992980624335197, "No": 0.0007018011894222869}, "ground_truth": 0}, {"key": "24388238", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9911463251654683, "res": {"Yes": 0.9911463251654683, "No": 0.008851587123963599}, "ground_truth": 1}, {"key": "24388238", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9968633364402578, "res": {"Yes": 0.9968633364402578, "No": 0.003135570950837783}, "ground_truth": 0}, {"key": "24388238", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994424774734731, "res": {"Yes": 0.9994424774734731, "No": 0.0005573367068753755}, "ground_truth": 0}, {"key": "35024827", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.09265590442526511, "res": {"No": 0.9073427881940984, "Yes": 0.09265590442526511}, "ground_truth": 0}, {"key": "35024827", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5659181401211053, "res": {"Yes": 0.5659181401211053, "No": 0.4340750211619969}, "ground_truth": 0}, {"key": "35024827", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980512452929581, "res": {"Yes": 0.9980512452929581, "No": 0.0019458293339790812}, "ground_truth": 1}, {"key": "35024827", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6487635749127213, "res": {"Yes": 0.6487635749127213, "No": 0.35122820854087744}, "ground_truth": 0}, {"key": "35024827", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.19915760157201806, "res": {"No": 0.8008390167121444, "Yes": 0.19915760157201806}, "ground_truth": 0}, {"key": "38624944", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7748672690797375, "res": {"Yes": 0.7748672690797375, "No": 0.2251296321039433}, "ground_truth": 0}, {"key": "38624944", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6608798273305087, "res": {"Yes": 0.6608798273305087, "No": 0.33910472364521926}, "ground_truth": 0}, {"key": "38624944", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9166863174511201, "res": {"Yes": 0.9166863174511201, "No": 0.0832956709956086}, "ground_truth": 1}, {"key": "38624944", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9692727935688529, "res": {"Yes": 0.9692727935688529, "No": 0.03072488089569128}, "ground_truth": 0}, {"key": "38624944", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9258812799061473, "res": {"Yes": 0.9258812799061473, "No": 0.07410855509281412}, "ground_truth": 0}, {"key": "34719830", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8525142111438049, "res": {"Yes": 0.8525142111438049, "No": 0.14747545851420268}, "ground_truth": 0}, {"key": "34719830", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9901811101890577, "res": {"Yes": 0.9901811101890577, "No": 0.00981770392643806}, "ground_truth": 0}, {"key": "34719830", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9382089158393185, "res": {"Yes": 0.9382089158393185, "No": 0.061788643100891355}, "ground_truth": 1}, {"key": "34719830", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5061652914969371, "res": {"Yes": 0.5061652914969371, "No": 0.4938254817601386}, "ground_truth": 0}, {"key": "34719830", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.44250876801822947, "res": {"No": 0.5574833174232927, "Yes": 0.44250876801822947}, "ground_truth": 0}, {"key": "38995225", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7391347009618715, "res": {"Yes": 0.7391347009618715, "No": 0.26082518117643816}, "ground_truth": 0}, {"key": "38995225", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9915030548383029, "res": {"Yes": 0.9915030548383029, "No": 0.008496145405888045}, "ground_truth": 0}, {"key": "38995225", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9928445087098653, "res": {"Yes": 0.9928445087098653, "No": 0.007154512517649241}, "ground_truth": 1}, {"key": "38995225", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9971479620098678, "res": {"Yes": 0.9971479620098678, "No": 0.002850820589511413}, "ground_truth": 0}, {"key": "38995225", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9017186153164092, "res": {"Yes": 0.9017186153164092, "No": 0.09827643557966852}, "ground_truth": 0}, {"key": "34242311", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3320689669041074, "res": {"No": 0.6679302547188628, "Yes": 0.3320689669041074}, "ground_truth": 0}, {"key": "34242311", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9984204435145674, "res": {"Yes": 0.9984204435145674, "No": 0.0015795242261178967}, "ground_truth": 0}, {"key": "34242311", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9983770807600174, "res": {"Yes": 0.9983770807600174, "No": 0.0016228620353640746}, "ground_truth": 1}, {"key": "34242311", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9956085151928441, "res": {"Yes": 0.9956085151928441, "No": 0.004391165049386495}, "ground_truth": 0}, {"key": "34242311", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996426718769061, "res": {"Yes": 0.9996426718769061, "No": 0.0003571038221916934}, "ground_truth": 0}, {"key": "39253748", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.010469259316624234, "res": {"No": 0.9895295755476404, "Yes": 0.010469259316624234}, "ground_truth": 0}, {"key": "39253748", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8718910025165464, "res": {"Yes": 0.8718910025165464, "No": 0.12810864320875306}, "ground_truth": 0}, {"key": "39253748", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.837199069377614, "res": {"Yes": 0.837199069377614, "No": 0.16279822962697596}, "ground_truth": 1}, {"key": "39253748", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8376977028809516, "res": {"Yes": 0.8376977028809516, "No": 0.1622991080765671}, "ground_truth": 0}, {"key": "39253748", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.2241906215389018, "res": {"No": 0.7757939829001249, "Yes": 0.2241906215389018}, "ground_truth": 0}, {"key": "37131104", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 4.379070809637514e-06, "res": {"No": 0.9999947998470209, "Yes": 4.379070809637514e-06}, "ground_truth": 0}, {"key": "37131104", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995808548458833, "res": {"Yes": 0.9995808548458833, "No": 0.0004183510689787684}, "ground_truth": 0}, {"key": "37131104", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995338085810045, "res": {"Yes": 0.9995338085810045, "No": 0.0004652993481680478}, "ground_truth": 1}, {"key": "37131104", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9938498888334403, "res": {"Yes": 0.9938498888334403, "No": 0.00614897424810836}, "ground_truth": 0}, {"key": "37131104", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999038520625092, "res": {"Yes": 0.9999038520625092, "No": 9.513829386588564e-05}, "ground_truth": 0}, {"key": "38490554", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9783702205100235, "res": {"Yes": 0.9783702205100235, "No": 0.02162936709420115}, "ground_truth": 0}, {"key": "38490554", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9822575412961189, "res": {"Yes": 0.9822575412961189, "No": 0.01774211654551814}, "ground_truth": 0}, {"key": "38490554", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993525841641304, "res": {"Yes": 0.9993525841641304, "No": 0.0006467698793943832}, "ground_truth": 1}, {"key": "38490554", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986040720151285, "res": {"Yes": 0.9986040720151285, "No": 0.001395564899219668}, "ground_truth": 0}, {"key": "38490554", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999134648602662, "res": {"Yes": 0.999134648602662, "No": 0.0008599669497314662}, "ground_truth": 0}, {"key": "29009500", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.26373562448488136, "res": {"No": 0.736261385470063, "Yes": 0.26373562448488136}, "ground_truth": 0}, {"key": "29009500", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9965645497096947, "res": {"Yes": 0.9965645497096947, "No": 0.003434990908624409}, "ground_truth": 0}, {"key": "29009500", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9967424023226871, "res": {"Yes": 0.9967424023226871, "No": 0.003256911256713963}, "ground_truth": 1}, {"key": "29009500", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9656897230842306, "res": {"Yes": 0.9656897230842306, "No": 0.03431011741285603}, "ground_truth": 0}, {"key": "29009500", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.992400267615077, "res": {"Yes": 0.992400267615077, "No": 0.007599183284729161}, "ground_truth": 0}, {"key": "36703057", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9526375051865045, "res": {"Yes": 0.9526375051865045, "No": 0.047361590773642104}, "ground_truth": 0}, {"key": "36703057", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.560469272253701, "res": {"Yes": 0.560469272253701, "No": 0.43952652983679696}, "ground_truth": 0}, {"key": "36703057", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4534892564523808, "res": {"No": 0.5465077119156824, "Yes": 0.4534892564523808}, "ground_truth": 1}, {"key": "36703057", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.963423174659578, "res": {"Yes": 0.963423174659578, "No": 0.03657312492374388}, "ground_truth": 0}, {"key": "36703057", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.35251094766725777, "res": {"No": 0.647469636463916, "Yes": 0.35251094766725777}, "ground_truth": 0}, {"key": "34876987", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.01704869700784807, "res": {"No": 0.9829507714474979, "Yes": 0.01704869700784807}, "ground_truth": 0}, {"key": "34876987", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8738629442347305, "res": {"Yes": 0.8738629442347305, "No": 0.12612069924971994}, "ground_truth": 0}, {"key": "34876987", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9766814590195735, "res": {"Yes": 0.9766814590195735, "No": 0.023316472358938307}, "ground_truth": 1}, {"key": "34876987", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.988578587263932, "res": {"Yes": 0.988578587263932, "No": 0.011418680777896996}, "ground_truth": 0}, {"key": "34876987", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.1590016817140365, "res": {"No": 0.8409897222095305, "Yes": 0.1590016817140365}, "ground_truth": 0}, {"key": "36209258", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9985506988527517, "res": {"Yes": 0.9985506988527517, "No": 0.001448911781253162}, "ground_truth": 0}, {"key": "36209258", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994886817677452, "res": {"Yes": 0.9994886817677452, "No": 0.0005109693244464212}, "ground_truth": 0}, {"key": "36209258", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994953501385975, "res": {"Yes": 0.9994953501385975, "No": 0.0005042515032370193}, "ground_truth": 1}, {"key": "36209258", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991084688502581, "res": {"Yes": 0.9991084688502581, "No": 0.0008907315202275176}, "ground_truth": 0}, {"key": "36209258", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996607808478312, "res": {"Yes": 0.9996607808478312, "No": 0.0003386112038719674}, "ground_truth": 0}, {"key": "36854437", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9223311731051327, "res": {"Yes": 0.9223311731051327, "No": 0.077665370738045}, "ground_truth": 0}, {"key": "36854437", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9982675351527719, "res": {"Yes": 0.9982675351527719, "No": 0.0017323074033106078}, "ground_truth": 0}, {"key": "36854437", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998795371462323, "res": {"Yes": 0.9998795371462323, "No": 0.00012021328714509226}, "ground_truth": 1}, {"key": "36854437", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999253068846696, "res": {"Yes": 0.9999253068846696, "No": 7.433185226922671e-05}, "ground_truth": 0}, {"key": "36854437", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9977970979579989, "res": {"Yes": 0.9977970979579989, "No": 0.0022027720258863265}, "ground_truth": 0}, {"key": "38047723", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.003763006650622335, "res": {"No": 0.9962357627704026, "Yes": 0.003763006650622335}, "ground_truth": 0}, {"key": "38047723", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9168116462042305, "res": {"Yes": 0.9168116462042305, "No": 0.0831863755477547}, "ground_truth": 0}, {"key": "38047723", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8832971427332083, "res": {"Yes": 0.8832971427332083, "No": 0.11669462488557009}, "ground_truth": 1}, {"key": "38047723", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.986508858335726, "res": {"Yes": 0.986508858335726, "No": 0.013486789880211097}, "ground_truth": 0}, {"key": "38047723", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.962102283657623, "res": {"Yes": 0.962102283657623, "No": 0.03789496595962437}, "ground_truth": 0}, {"key": "34287816", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9324669877196978, "res": {"Yes": 0.9324669877196978, "No": 0.06753171092092378}, "ground_truth": 0}, {"key": "34287816", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9426678022354638, "res": {"Yes": 0.9426678022354638, "No": 0.05733160710063069}, "ground_truth": 0}, {"key": "34287816", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9695916310957251, "res": {"Yes": 0.9695916310957251, "No": 0.030408107866343435}, "ground_truth": 1}, {"key": "34287816", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9893946534833762, "res": {"Yes": 0.9893946534833762, "No": 0.010604243794651491}, "ground_truth": 0}, {"key": "34287816", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6353297204800075, "res": {"Yes": 0.6353297204800075, "No": 0.3646652388785092}, "ground_truth": 0}, {"key": "33235855", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9882930148191141, "res": {"Yes": 0.9882930148191141, "No": 0.011706523833132226}, "ground_truth": 0}, {"key": "33235855", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998776374469079, "res": {"Yes": 0.9998776374469079, "No": 0.00012203910888130622}, "ground_truth": 0}, {"key": "33235855", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9973522255546627, "res": {"Yes": 0.9973522255546627, "No": 0.0026474297905248302}, "ground_truth": 1}, {"key": "33235855", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999050439846079, "res": {"Yes": 0.9999050439846079, "No": 9.476930386783199e-05}, "ground_truth": 0}, {"key": "33235855", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9974981063658707, "res": {"Yes": 0.9974981063658707, "No": 0.002501353233886234}, "ground_truth": 0}, {"key": "34381016", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8908943261036275, "res": {"Yes": 0.8908943261036275, "No": 0.10910506084558913}, "ground_truth": 0}, {"key": "34381016", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.00684341775745288, "res": {"No": 0.9931554219614717, "Yes": 0.00684341775745288}, "ground_truth": 0}, {"key": "34381016", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9641441522710844, "res": {"Yes": 0.9641441522710844, "No": 0.03585425607554229}, "ground_truth": 1}, {"key": "34381016", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.983773703004505, "res": {"Yes": 0.983773703004505, "No": 0.01622548702326924}, "ground_truth": 0}, {"key": "34381016", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9365314267495636, "res": {"Yes": 0.9365314267495636, "No": 0.06346537483440871}, "ground_truth": 0}, {"key": "28064995", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.005303544014028575, "res": {"No": 0.9946962796536603, "Yes": 0.005303544014028575}, "ground_truth": 0}, {"key": "28064995", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996229023192102, "res": {"Yes": 0.9996229023192102, "No": 0.00037651544085432696}, "ground_truth": 0}, {"key": "28064995", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996486299449218, "res": {"Yes": 0.9996486299449218, "No": 0.00035126539819486214}, "ground_truth": 1}, {"key": "28064995", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986752789186538, "res": {"Yes": 0.9986752789186538, "No": 0.0013245881474175116}, "ground_truth": 0}, {"key": "28064995", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995770419519847, "res": {"Yes": 0.9995770419519847, "No": 0.000422400137521729}, "ground_truth": 0}, {"key": "37576197", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0005979176036772301, "res": {"No": 0.9994015134345732, "Yes": 0.0005979176036772301}, "ground_truth": 0}, {"key": "37576197", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.3278249834660315, "res": {"No": 0.67215813244708, "Yes": 0.3278249834660315}, "ground_truth": 0}, {"key": "37576197", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.863613144386937, "res": {"Yes": 0.863613144386937, "No": 0.13636693158847837}, "ground_truth": 1}, {"key": "37576197", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9925856975597069, "res": {"Yes": 0.9925856975597069, "No": 0.007411491336038347}, "ground_truth": 0}, {"key": "37576197", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.20096984641754895, "res": {"No": 0.7990007216698, "Yes": 0.20096984641754895}, "ground_truth": 0}, {"key": "34454741", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9274940960180481, "res": {"Yes": 0.9274940960180481, "No": 0.07250216902375464}, "ground_truth": 0}, {"key": "34454741", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9965682210602584, "res": {"Yes": 0.9965682210602584, "No": 0.003431376796316667}, "ground_truth": 0}, {"key": "34454741", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9949330620581296, "res": {"Yes": 0.9949330620581296, "No": 0.005064701889364042}, "ground_truth": 1}, {"key": "34454741", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996835339659427, "res": {"Yes": 0.9996835339659427, "No": 0.00031628463693965267}, "ground_truth": 0}, {"key": "34454741", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985736391210275, "res": {"Yes": 0.9985736391210275, "No": 0.00142608977949388}, "ground_truth": 0}, {"key": "34766970", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.993057601566006, "res": {"Yes": 0.993057601566006, "No": 0.006941756073113964}, "ground_truth": 0}, {"key": "34766970", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995289234913968, "res": {"Yes": 0.9995289234913968, "No": 0.00047079631957217997}, "ground_truth": 0}, {"key": "34766970", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9959636042329507, "res": {"Yes": 0.9959636042329507, "No": 0.004036151661566202}, "ground_truth": 1}, {"key": "34766970", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999018257994022, "res": {"Yes": 0.9999018257994022, "No": 9.782171214407023e-05}, "ground_truth": 0}, {"key": "34766970", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9954270419588347, "res": {"Yes": 0.9954270419588347, "No": 0.004572246588552222}, "ground_truth": 0}, {"key": "35574186", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.2989367399648146, "res": {"No": 0.7010614326869241, "Yes": 0.2989367399648146}, "ground_truth": 0}, {"key": "35574186", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9831194199650686, "res": {"Yes": 0.9831194199650686, "No": 0.01687104061459076}, "ground_truth": 0}, {"key": "35574186", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.18810704309905155, "res": {"No": 0.8118799455981243, "Yes": 0.18810704309905155}, "ground_truth": 1}, {"key": "35574186", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9928215870740064, "res": {"Yes": 0.9928215870740064, "No": 0.007176130275905736}, "ground_truth": 0}, {"key": "35574186", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.02240789784270604, "res": {"No": 0.9775824625654608, "Yes": 0.02240789784270604}, "ground_truth": 0}, {"key": "35486470", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.00015274098189286262, "res": {"No": 0.9998468908124082, "Yes": 0.00015274098189286262}, "ground_truth": 0}, {"key": "35486470", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9192749476811182, "res": {"Yes": 0.9192749476811182, "No": 0.08071975000544429}, "ground_truth": 0}, {"key": "35486470", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.40910345856515884, "res": {"No": 0.590891497382741, "Yes": 0.40910345856515884}, "ground_truth": 1}, {"key": "35486470", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9875950042490103, "res": {"Yes": 0.9875950042490103, "No": 0.012403327445369641}, "ground_truth": 0}, {"key": "35486470", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.15465689442764133, "res": {"No": 0.8453387621601582, "Yes": 0.15465689442764133}, "ground_truth": 0}, {"key": "40977702", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.012974145623474834, "res": {"No": 0.987025613523864, "Yes": 0.012974145623474834}, "ground_truth": 0}, {"key": "40977702", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8743714793907038, "res": {"Yes": 0.8743714793907038, "No": 0.12562110570656662}, "ground_truth": 0}, {"key": "40977702", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.09168159763104022, "res": {"No": 0.9082912517270358, "Yes": 0.09168159763104022}, "ground_truth": 1}, {"key": "40977702", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.29868278156442757, "res": {"No": 0.7012867199157016, "Yes": 0.29868278156442757}, "ground_truth": 0}, {"key": "40977702", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.22603733369772613, "res": {"No": 0.7738771259480087, "Yes": 0.22603733369772613}, "ground_truth": 0}, {"key": "35336618", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 3.30492395833284e-05, "res": {"No": 0.9999669067235946, "Yes": 3.30492395833284e-05}, "ground_truth": 0}, {"key": "35336618", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9860800332981512, "res": {"Yes": 0.9860800332981512, "No": 0.013919000914991573}, "ground_truth": 0}, {"key": "35336618", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9824175601534278, "res": {"Yes": 0.9824175601534278, "No": 0.017582011033642944}, "ground_truth": 1}, {"key": "35336618", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9943951312163555, "res": {"Yes": 0.9943951312163555, "No": 0.005604601064074976}, "ground_truth": 0}, {"key": "35336618", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990700377831359, "res": {"Yes": 0.9990700377831359, "No": 0.0009293570081710504}, "ground_truth": 0}, {"key": "33024679", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9977434551339649, "res": {"Yes": 0.9977434551339649, "No": 0.0022563766601412633}, "ground_truth": 0}, {"key": "33024679", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997533529623831, "res": {"Yes": 0.9997533529623831, "No": 0.0002465795249699727}, "ground_truth": 0}, {"key": "33024679", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9986800372182235, "res": {"Yes": 0.9986800372182235, "No": 0.0013198938002190398}, "ground_truth": 1}, {"key": "33024679", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9954708681917931, "res": {"Yes": 0.9954708681917931, "No": 0.004528425371610906}, "ground_truth": 0}, {"key": "33024679", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993593744482288, "res": {"Yes": 0.9993593744482288, "No": 0.0006399048912983822}, "ground_truth": 0}, {"key": "37451334", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9982904652220936, "res": {"Yes": 0.9982904652220936, "No": 0.001709168985470468}, "ground_truth": 0}, {"key": "37451334", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990766997042659, "res": {"Yes": 0.9990766997042659, "No": 0.0009231198348334106}, "ground_truth": 0}, {"key": "37451334", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9941530741929734, "res": {"Yes": 0.9941530741929734, "No": 0.0058465706693170815}, "ground_truth": 1}, {"key": "37451334", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992953226617778, "res": {"Yes": 0.9992953226617778, "No": 0.0007041620807265094}, "ground_truth": 0}, {"key": "37451334", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9949597272184721, "res": {"Yes": 0.9949597272184721, "No": 0.005039263190233501}, "ground_truth": 0}, {"key": "33354824", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9895225706925688, "res": {"Yes": 0.9895225706925688, "No": 0.010477296509700366}, "ground_truth": 0}, {"key": "33354824", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999433054571963, "res": {"Yes": 0.9999433054571963, "No": 5.646627503862622e-05}, "ground_truth": 0}, {"key": "33354824", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999099308804668, "res": {"Yes": 0.9999099308804668, "No": 8.998685084771111e-05}, "ground_truth": 1}, {"key": "33354824", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986996580781836, "res": {"Yes": 0.9986996580781836, "No": 0.0013001997142081476}, "ground_truth": 0}, {"key": "33354824", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999265568886651, "res": {"Yes": 0.999265568886651, "No": 0.0007343696836081856}, "ground_truth": 0}, {"key": "34688538", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0041574956217273785, "res": {"No": 0.9958420612636845, "Yes": 0.0041574956217273785}, "ground_truth": 0}, {"key": "34688538", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.003850393223207144, "res": {"No": 0.9961451403212784, "Yes": 0.003850393223207144}, "ground_truth": 0}, {"key": "34688538", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.008904789508239546, "res": {"No": 0.9910929241356649, "Yes": 0.008904789508239546}, "ground_truth": 1}, {"key": "34688538", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.35702456144616146, "res": {"No": 0.6429611477345657, "Yes": 0.35702456144616146}, "ground_truth": 0}, {"key": "34688538", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.15485007317638624, "res": {"No": 0.8451460046354597, "Yes": 0.15485007317638624}, "ground_truth": 0}, {"key": "33646276", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4435847952078133, "res": {"No": 0.5564097142350372, "Yes": 0.4435847952078133}, "ground_truth": 0}, {"key": "33646276", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.06884159074823402, "res": {"No": 0.9311482192747467, "Yes": 0.06884159074823402}, "ground_truth": 0}, {"key": "33646276", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9809654246921723, "res": {"Yes": 0.9809654246921723, "No": 0.01903240549975931}, "ground_truth": 1}, {"key": "33646276", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4387327593074001, "res": {"No": 0.5612611913948614, "Yes": 0.4387327593074001}, "ground_truth": 0}, {"key": "33646276", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9980555246464567, "res": {"Yes": 0.9980555246464567, "No": 0.0019432638940033485}, "ground_truth": 0}, {"key": "40322608", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 8.809709495234778e-05, "res": {"No": 0.9999112420092235, "Yes": 8.809709495234778e-05}, "ground_truth": 0}, {"key": "40322608", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9980421211501801, "res": {"Yes": 0.9980421211501801, "No": 0.0019576725222715027}, "ground_truth": 0}, {"key": "40322608", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9949213795232105, "res": {"Yes": 0.9949213795232105, "No": 0.005078009118571014}, "ground_truth": 1}, {"key": "40322608", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.2374076199041662, "res": {"No": 0.762590491625922, "Yes": 0.2374076199041662}, "ground_truth": 0}, {"key": "40322608", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9439896442225871, "res": {"Yes": 0.9439896442225871, "No": 0.056009144888437404}, "ground_truth": 0}, {"key": "39565762", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9977702762353725, "res": {"Yes": 0.9977702762353725, "No": 0.0022291373654177654}, "ground_truth": 0}, {"key": "39565762", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994878477947371, "res": {"Yes": 0.9994878477947371, "No": 0.0005114506286037667}, "ground_truth": 0}, {"key": "39565762", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999273332003598, "res": {"Yes": 0.9999273332003598, "No": 7.245705619095769e-05}, "ground_truth": 1}, {"key": "39565762", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988152334906749, "res": {"Yes": 0.9988152334906749, "No": 0.0011844520694256333}, "ground_truth": 0}, {"key": "39565762", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995247570437253, "res": {"Yes": 0.9995247570437253, "No": 0.0004747980510586158}, "ground_truth": 0}, {"key": "30534259", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 2.4309050849757154e-07, "res": {"No": 0.9999995679800934, "Yes": 2.4309050849757154e-07}, "ground_truth": 0}, {"key": "30534259", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9974057136921982, "res": {"Yes": 0.9974057136921982, "No": 0.002593798176721698}, "ground_truth": 0}, {"key": "30534259", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9979544933060679, "res": {"Yes": 0.9979544933060679, "No": 0.0020448803495021163}, "ground_truth": 1}, {"key": "30534259", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997614458585652, "res": {"Yes": 0.9997614458585652, "No": 0.0002381678216021433}, "ground_truth": 0}, {"key": "30534259", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9822404138206976, "res": {"Yes": 0.9822404138206976, "No": 0.017756972913589446}, "ground_truth": 0}, {"key": "39644242", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8821678808395387, "res": {"Yes": 0.8821678808395387, "No": 0.11782885366777529}, "ground_truth": 0}, {"key": "39644242", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9969319330661679, "res": {"Yes": 0.9969319330661679, "No": 0.003066676123040019}, "ground_truth": 0}, {"key": "39644242", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9713616470394251, "res": {"Yes": 0.9713616470394251, "No": 0.028637678446618225}, "ground_truth": 1}, {"key": "39644242", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996326733809481, "res": {"Yes": 0.9996326733809481, "No": 0.00036659810195492165}, "ground_truth": 0}, {"key": "39644242", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999366276487621, "res": {"Yes": 0.999366276487621, "No": 0.0006333960247052306}, "ground_truth": 0}, {"key": "19853740", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9972741007288741, "res": {"Yes": 0.9972741007288741, "No": 0.0027245219430509482}, "ground_truth": 0}, {"key": "19853740", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9583352379449054, "res": {"Yes": 0.9583352379449054, "No": 0.041629725982885606}, "ground_truth": 0}, {"key": "19853740", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6719112873805568, "res": {"Yes": 0.6719112873805568, "No": 0.32808606884661545}, "ground_truth": 1}, {"key": "19853740", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9323970180222353, "res": {"Yes": 0.9323970180222353, "No": 0.06759906009161988}, "ground_truth": 0}, {"key": "19853740", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9822830832710477, "res": {"Yes": 0.9822830832710477, "No": 0.017715594182839776}, "ground_truth": 0}, {"key": "33023078", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.1063596928973577, "res": {"No": 0.8936389450332077, "Yes": 0.1063596928973577}, "ground_truth": 0}, {"key": "33023078", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9089774432673103, "res": {"Yes": 0.9089774432673103, "No": 0.0910215761517958}, "ground_truth": 0}, {"key": "33023078", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9928931574955137, "res": {"Yes": 0.9928931574955137, "No": 0.007106581162273544}, "ground_truth": 1}, {"key": "33023078", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989572540377992, "res": {"Yes": 0.9989572540377992, "No": 0.0010425089700122885}, "ground_truth": 0}, {"key": "33023078", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9935028877016254, "res": {"Yes": 0.9935028877016254, "No": 0.006496829437041977}, "ground_truth": 0}, {"key": "38329806", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8443031216418031, "res": {"Yes": 0.8443031216418031, "No": 0.15569615427963268}, "ground_truth": 0}, {"key": "38329806", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.960002148021848, "res": {"Yes": 0.960002148021848, "No": 0.03999731308497598}, "ground_truth": 0}, {"key": "38329806", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0419341729889715, "res": {"No": 0.9580651088612099, "Yes": 0.0419341729889715}, "ground_truth": 1}, {"key": "38329806", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9812157980337427, "res": {"Yes": 0.9812157980337427, "No": 0.018782554351392537}, "ground_truth": 0}, {"key": "38329806", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999404447334853, "res": {"Yes": 0.9999404447334853, "No": 5.950554836073066e-05}, "ground_truth": 0}, {"key": "38761942", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9876470987904132, "res": {"Yes": 0.9876470987904132, "No": 0.012352467973027593}, "ground_truth": 0}, {"key": "38761942", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9972825155637826, "res": {"Yes": 0.9972825155637826, "No": 0.002717340593323537}, "ground_truth": 0}, {"key": "38761942", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9989017077648844, "res": {"Yes": 0.9989017077648844, "No": 0.0010981111626392182}, "ground_truth": 1}, {"key": "38761942", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997023586839678, "res": {"Yes": 0.9997023586839678, "No": 0.00029752330497389255}, "ground_truth": 0}, {"key": "38761942", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9958629891045004, "res": {"Yes": 0.9958629891045004, "No": 0.004136716176383808}, "ground_truth": 0}, {"key": "33773576", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9813249574942637, "res": {"Yes": 0.9813249574942637, "No": 0.018674758122280213}, "ground_truth": 0}, {"key": "33773576", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996299326918046, "res": {"Yes": 0.9996299326918046, "No": 0.00036995469713429346}, "ground_truth": 0}, {"key": "33773576", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9568312551343084, "res": {"Yes": 0.9568312551343084, "No": 0.043168233062795935}, "ground_truth": 1}, {"key": "33773576", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994635539386676, "res": {"Yes": 0.9994635539386676, "No": 0.0005361728325937496}, "ground_truth": 0}, {"key": "33773576", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9975590757123475, "res": {"Yes": 0.9975590757123475, "No": 0.0024401679745935365}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9944892058432051, "res": {"Yes": 0.9944892058432051, "No": 0.005510532599292393}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994989207821441, "res": {"Yes": 0.9994989207821441, "No": 0.0005007322654607871}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995269016763211, "res": {"Yes": 0.9995269016763211, "No": 0.000472500997462953}, "ground_truth": 1}, {"key": "37642631", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999732620532263, "res": {"Yes": 0.999732620532263, "No": 0.00026684782656478685}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998598784379432, "res": {"Yes": 0.9998598784379432, "No": 0.00013945285092971068}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9044883267310959, "res": {"Yes": 0.9044883267310959, "No": 0.09551108165071352}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999855020530962, "res": {"Yes": 0.9999855020530962, "No": 1.4197665617569486e-05}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999965878943212, "res": {"Yes": 0.9999965878943212, "No": 3.106499588210657e-06}, "ground_truth": 1}, {"key": "36609836", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999452126088839, "res": {"Yes": 0.9999452126088839, "No": 5.4499937668117265e-05}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999953079650794, "res": {"Yes": 0.999953079650794, "No": 4.679407339119899e-05}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8454261662530548, "res": {"Yes": 0.8454261662530548, "No": 0.15457262938448826}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9695483805169132, "res": {"Yes": 0.9695483805169132, "No": 0.03044946666762945}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.96537976422688, "res": {"Yes": 0.96537976422688, "No": 0.03461825966982787}, "ground_truth": 1}, {"key": "41035610", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9975132899986058, "res": {"Yes": 0.9975132899986058, "No": 0.0024865867301588304}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6967764648931402, "res": {"Yes": 0.6967764648931402, "No": 0.303218109225644}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9982108703040922, "res": {"Yes": 0.9982108703040922, "No": 0.0017889954818066925}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9924178847617562, "res": {"Yes": 0.9924178847617562, "No": 0.007580588074116056}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998771606953653, "res": {"Yes": 0.9998771606953653, "No": 0.00012257309647736725}, "ground_truth": 1}, {"key": "37592684", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999985978860297, "res": {"Yes": 0.999985978860297, "No": 1.3939374841707097e-05}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993328204333302, "res": {"Yes": 0.9993328204333302, "No": 0.0006668569518780473}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9979243438597377, "res": {"Yes": 0.9979243438597377, "No": 0.0020755149238765895}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8492231827571916, "res": {"Yes": 0.8492231827571916, "No": 0.15077364599306767}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7513014271761113, "res": {"Yes": 0.7513014271761113, "No": 0.2486969977546912}, "ground_truth": 1}, {"key": "38951040", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9855544280951634, "res": {"Yes": 0.9855544280951634, "No": 0.014444961649499495}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9404406405615168, "res": {"Yes": 0.9404406405615168, "No": 0.059556311632875863}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.49297160645281923, "res": {"No": 0.5070239691897855, "Yes": 0.49297160645281923}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.497282253301579, "res": {"No": 0.5027143162370195, "Yes": 0.497282253301579}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8890041725030504, "res": {"Yes": 0.8890041725030504, "No": 0.11099423677096955}, "ground_truth": 1}, {"key": "40774469", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3737662563396451, "res": {"No": 0.6262320435300808, "Yes": 0.3737662563396451}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7465900796196432, "res": {"Yes": 0.7465900796196432, "No": 0.2534086185580604}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.15086569123396554, "res": {"No": 0.8491324056510776, "Yes": 0.15086569123396554}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9920131031142235, "res": {"Yes": 0.9920131031142235, "No": 0.00798616747090004}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5618873691154391, "res": {"Yes": 0.5618873691154391, "No": 0.43811109903708856}, "ground_truth": 1}, {"key": "40876288", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9939180772257211, "res": {"Yes": 0.9939180772257211, "No": 0.006080723459703547}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9971684743521416, "res": {"Yes": 0.9971684743521416, "No": 0.0028305605860504423}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7209424677191922, "res": {"Yes": 0.7209424677191922, "No": 0.27905616756085083}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9907008014797474, "res": {"Yes": 0.9907008014797474, "No": 0.009290623622923336}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9970507835085564, "res": {"Yes": 0.9970507835085564, "No": 0.0029415677248748285}, "ground_truth": 1}, {"key": "40340131", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9186162842496176, "res": {"Yes": 0.9186162842496176, "No": 0.08137026235956345}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9937283812174195, "res": {"Yes": 0.9937283812174195, "No": 0.006262818221811616}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9987858584669796, "res": {"Yes": 0.9987858584669796, "No": 0.0012136988273866887}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9869682551840371, "res": {"Yes": 0.9869682551840371, "No": 0.013031471011653452}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999847868417213, "res": {"Yes": 0.9999847868417213, "No": 1.458800415784085e-05}, "ground_truth": 1}, {"key": "30121591", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989614181997918, "res": {"Yes": 0.9989614181997918, "No": 0.0010373602642401538}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.998500426984919, "res": {"Yes": 0.998500426984919, "No": 0.001498987348286044}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.1805502403589129, "res": {"No": 0.8194487916991676, "Yes": 0.1805502403589129}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9955607736237245, "res": {"Yes": 0.9955607736237245, "No": 0.004438666435578449}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6698149089909637, "res": {"Yes": 0.6698149089909637, "No": 0.33017885054056045}, "ground_truth": 1}, {"key": "35623366", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9649910763419011, "res": {"Yes": 0.9649910763419011, "No": 0.03500648321262898}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.826972481171496, "res": {"Yes": 0.826972481171496, "No": 0.17302508413415513}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9941510699823961, "res": {"Yes": 0.9941510699823961, "No": 0.005848588084182046}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999543908301298, "res": {"Yes": 0.9999543908301298, "No": 4.554025034903622e-05}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999920539107184, "res": {"Yes": 0.999920539107184, "No": 7.93930281691717e-05}, "ground_truth": 1}, {"key": "41014093", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994556944480424, "res": {"Yes": 0.9994556944480424, "No": 0.0005441778687149775}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999100500717374, "res": {"Yes": 0.9999100500717374, "No": 8.984685033961977e-05}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.04637194204310412, "res": {"No": 0.9536275505418899, "Yes": 0.04637194204310412}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9963757486107451, "res": {"Yes": 0.9963757486107451, "No": 0.0036238872620178923}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9972877316641645, "res": {"Yes": 0.9972877316641645, "No": 0.0027121868873866434}, "ground_truth": 1}, {"key": "11387984", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9623293223241486, "res": {"Yes": 0.9623293223241486, "No": 0.037670537075497924}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8289893671872213, "res": {"Yes": 0.8289893671872213, "No": 0.1710102983540837}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.021034178850428745, "res": {"No": 0.978965099714236, "Yes": 0.021034178850428745}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9871345654498708, "res": {"Yes": 0.9871345654498708, "No": 0.01286232607216102}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.45590984379090577, "res": {"No": 0.5440045326955333, "Yes": 0.45590984379090577}, "ground_truth": 1}, {"key": "39508312", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9649320178003541, "res": {"Yes": 0.9649320178003541, "No": 0.035052175463338824}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9965493954664356, "res": {"Yes": 0.9965493954664356, "No": 0.0034475549821917123}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.010579105525813277, "res": {"No": 0.989420561121572, "Yes": 0.010579105525813277}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989215674268243, "res": {"Yes": 0.9989215674268243, "No": 0.001078073097880195}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9514238185818833, "res": {"Yes": 0.9514238185818833, "No": 0.04857393542829839}, "ground_truth": 1}, {"key": "35815369", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9942762066818196, "res": {"Yes": 0.9942762066818196, "No": 0.005723292656264752}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9219729216499926, "res": {"Yes": 0.9219729216499926, "No": 0.07802562348663465}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.09753724245640034, "res": {"No": 0.9024543876971892, "Yes": 0.09753724245640034}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.14991102912937332, "res": {"No": 0.8500849783206579, "Yes": 0.14991102912937332}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7894896302117469, "res": {"Yes": 0.7894896302117469, "No": 0.21050998338020038}, "ground_truth": 1}, {"key": "35802823", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4671990410580897, "res": {"No": 0.5327993924783206, "Yes": 0.4671990410580897}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9677763033421729, "res": {"Yes": 0.9677763033421729, "No": 0.03222310619745544}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9462003366439115, "res": {"Yes": 0.9462003366439115, "No": 0.05379635849885932}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9394481223631871, "res": {"Yes": 0.9394481223631871, "No": 0.06054711843249173}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995299958465729, "res": {"Yes": 0.9995299958465729, "No": 0.00046958957004172977}, "ground_truth": 1}, {"key": "38499968", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995849060953229, "res": {"Yes": 0.9995849060953229, "No": 0.0004145352685650723}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.971983605921346, "res": {"Yes": 0.971983605921346, "No": 0.02801335270941887}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9988917130041798, "res": {"Yes": 0.9988917130041798, "No": 0.0011077053008461079}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9988444940117654, "res": {"Yes": 0.9988444940117654, "No": 0.0011553367720227108}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9964926890344542, "res": {"Yes": 0.9964926890344542, "No": 0.0035058835763788097}, "ground_truth": 1}, {"key": "36926726", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9982575578180987, "res": {"Yes": 0.9982575578180987, "No": 0.0017411943381250184}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9054318832991101, "res": {"Yes": 0.9054318832991101, "No": 0.09456678258990928}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0454163457584885, "res": {"No": 0.9545829227504643, "Yes": 0.0454163457584885}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990802688122431, "res": {"Yes": 0.9990802688122431, "No": 0.0009193662352800352}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999741197265207, "res": {"Yes": 0.999741197265207, "No": 0.0002587089172250735}, "ground_truth": 1}, {"key": "40903712", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997445341369622, "res": {"Yes": 0.9997445341369622, "No": 0.00025533120817521483}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9987778998733319, "res": {"Yes": 0.9987778998733319, "No": 0.001221697492529613}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5093901261085918, "res": {"Yes": 0.5093901261085918, "No": 0.4906031629857873}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9912276039832982, "res": {"Yes": 0.9912276039832982, "No": 0.008770298821775643}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9292362247186916, "res": {"Yes": 0.9292362247186916, "No": 0.07075970349432471}, "ground_truth": 1}, {"key": "19614862", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9819853826731655, "res": {"Yes": 0.9819853826731655, "No": 0.01801122687928176}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9904047510115035, "res": {"Yes": 0.9904047510115035, "No": 0.009594159989940319}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 3.348720943335577e-05, "res": {"No": 0.9999661915245194, "Yes": 3.348720943335577e-05}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9177456513484691, "res": {"Yes": 0.9177456513484691, "No": 0.08225139738481023}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7689412117946464, "res": {"Yes": 0.7689412117946464, "No": 0.2310480688149681}, "ground_truth": 1}, {"key": "38861704", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.48393015041724186, "res": {"No": 0.5160339092804329, "Yes": 0.48393015041724186}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9496126503579321, "res": {"Yes": 0.9496126503579321, "No": 0.05038026238262882}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.09833974598794519, "res": {"No": 0.9016595943543841, "Yes": 0.09833974598794519}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9963547993334049, "res": {"Yes": 0.9963547993334049, "No": 0.0036443272443786295}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987147589306589, "res": {"Yes": 0.9987147589306589, "No": 0.00128507139739934}, "ground_truth": 1}, {"key": "34349607", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995201103039121, "res": {"Yes": 0.9995201103039121, "No": 0.0004790785435439042}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990144778462579, "res": {"Yes": 0.9990144778462579, "No": 0.0009849211211987784}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9972590433998094, "res": {"Yes": 0.9972590433998094, "No": 0.0027407518456480495}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7462185419535344, "res": {"Yes": 0.7462185419535344, "No": 0.25378059105770095}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994721284232504, "res": {"Yes": 0.9994721284232504, "No": 0.0005277338886906472}, "ground_truth": 1}, {"key": "20773800", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990078164399288, "res": {"Yes": 0.9990078164399288, "No": 0.0009919052196021396}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999626155448161, "res": {"Yes": 0.9999626155448161, "No": 3.719712814754811e-05}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9892304968481556, "res": {"Yes": 0.9892304968481556, "No": 0.010768705392570408}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997415548027153, "res": {"Yes": 0.9997415548027153, "No": 0.00025801908575091213}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999561916926424, "res": {"Yes": 0.999561916926424, "No": 0.00043754263740040944}, "ground_truth": 1}, {"key": "35545608", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9979480840637115, "res": {"Yes": 0.9979480840637115, "No": 0.002050631263128731}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988102439216388, "res": {"Yes": 0.9988102439216388, "No": 0.0011889230281457396}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996352839250833, "res": {"Yes": 0.9996352839250833, "No": 0.00036451276009826416}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996601850501834, "res": {"Yes": 0.9996601850501834, "No": 0.0003395424099214722}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993746118867163, "res": {"Yes": 0.9993746118867163, "No": 0.0006252509305018354}, "ground_truth": 1}, {"key": "37258984", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999189987897066, "res": {"Yes": 0.999189987897066, "No": 0.0008097945374041837}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995851443764012, "res": {"Yes": 0.9995851443764012, "No": 0.0004146414446426185}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.998388007957127, "res": {"Yes": 0.998388007957127, "No": 0.0016118177493583818}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9887235333956272, "res": {"Yes": 0.9887235333956272, "No": 0.011276025999444514}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9725526754201028, "res": {"Yes": 0.9725526754201028, "No": 0.02744685196820582}, "ground_truth": 1}, {"key": "37274562", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9965843227430832, "res": {"Yes": 0.9965843227430832, "No": 0.003415591139708811}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9968700914084847, "res": {"Yes": 0.9968700914084847, "No": 0.003129592733464604}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9786496389111033, "res": {"Yes": 0.9786496389111033, "No": 0.021348431671821145}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9531440714465513, "res": {"Yes": 0.9531440714465513, "No": 0.046854721326328265}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9202031114414198, "res": {"Yes": 0.9202031114414198, "No": 0.07978984805301147}, "ground_truth": 1}, {"key": "40828068", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9814589498816685, "res": {"Yes": 0.9814589498816685, "No": 0.01854079573245153}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9948661614266227, "res": {"Yes": 0.9948661614266227, "No": 0.005131845181333209}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9289677644156372, "res": {"Yes": 0.9289677644156372, "No": 0.07103020996303121}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.813258151756876, "res": {"Yes": 0.813258151756876, "No": 0.18673620994966963}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7941353946841835, "res": {"Yes": 0.7941353946841835, "No": 0.20586276942927173}, "ground_truth": 1}, {"key": "37807180", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.10997243890423705, "res": {"No": 0.8900206538074447, "Yes": 0.10997243890423705}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.026574725076512963, "res": {"No": 0.9734179336806819, "Yes": 0.026574725076512963}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9695187961690008, "res": {"Yes": 0.9695187961690008, "No": 0.03048061107415476}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9872343510420097, "res": {"Yes": 0.9872343510420097, "No": 0.012765270981981358}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987771854477556, "res": {"Yes": 0.9987771854477556, "No": 0.001222801550447302}, "ground_truth": 1}, {"key": "40748607", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9962174256259744, "res": {"Yes": 0.9962174256259744, "No": 0.0037824799993342972}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9977679011458338, "res": {"Yes": 0.9977679011458338, "No": 0.0022320846713275487}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6482790322432935, "res": {"Yes": 0.6482790322432935, "No": 0.3517204834293904}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9740802008445292, "res": {"Yes": 0.9740802008445292, "No": 0.025918978966460466}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9804759617151646, "res": {"Yes": 0.9804759617151646, "No": 0.019523484591892244}, "ground_truth": 1}, {"key": "40123819", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8734444903217656, "res": {"Yes": 0.8734444903217656, "No": 0.12655321339725867}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9546384371799314, "res": {"Yes": 0.9546384371799314, "No": 0.04536045448963827}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8582241126904271, "res": {"Yes": 0.8582241126904271, "No": 0.14177542321063863}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.936426255493422, "res": {"Yes": 0.936426255493422, "No": 0.06357309072354177}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9978237978688678, "res": {"Yes": 0.9978237978688678, "No": 0.0021755897538520206}, "ground_truth": 1}, {"key": "38453867", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994884434896718, "res": {"Yes": 0.9994884434896718, "No": 0.0005115035664833151}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994160403408493, "res": {"Yes": 0.9994160403408493, "No": 0.0005834093931252002}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.985620775881329, "res": {"Yes": 0.985620775881329, "No": 0.014378920486313063}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.720245588494864, "res": {"Yes": 0.720245588494864, "No": 0.27975372959314215}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.29226571722722733, "res": {"No": 0.7077327700289959, "Yes": 0.29226571722722733}, "ground_truth": 1}, {"key": "38944856", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9971151286617722, "res": {"Yes": 0.9971151286617722, "No": 0.0028845173193611097}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.005148005092652544, "res": {"No": 0.9948482267380425, "Yes": 0.005148005092652544}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9976687009086275, "res": {"Yes": 0.9976687009086275, "No": 0.0023298439218003377}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9979783605713367, "res": {"Yes": 0.9979783605713367, "No": 0.0020210118038075497}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8680984926189045, "res": {"Yes": 0.8680984926189045, "No": 0.1318787287856094}, "ground_truth": 1}, {"key": "35778898", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9965195623133968, "res": {"Yes": 0.9965195623133968, "No": 0.003479476595846078}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9805088474304109, "res": {"Yes": 0.9805088474304109, "No": 0.019489167121663854}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9960764303923312, "res": {"Yes": 0.9960764303923312, "No": 0.003922875688983381}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9775970452718198, "res": {"Yes": 0.9775970452718198, "No": 0.022402594520959565}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9984768934059902, "res": {"Yes": 0.9984768934059902, "No": 0.0015229633038623548}, "ground_truth": 1}, {"key": "32530125", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7214324713146304, "res": {"Yes": 0.7214324713146304, "No": 0.2785659620729694}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.991870124650246, "res": {"Yes": 0.991870124650246, "No": 0.008129409421035695}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.49747048041160574, "res": {"No": 0.5025287131923899, "Yes": 0.49747048041160574}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.928001880311734, "res": {"Yes": 0.928001880311734, "No": 0.07199132883974578}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9931066233762386, "res": {"Yes": 0.9931066233762386, "No": 0.006891517303405153}, "ground_truth": 1}, {"key": "35010363", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8722593409013453, "res": {"Yes": 0.8722593409013453, "No": 0.12772449724540927}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9967216756786296, "res": {"Yes": 0.9967216756786296, "No": 0.0032776092812966764}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9661274767178475, "res": {"Yes": 0.9661274767178475, "No": 0.033872093642309316}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9487311108338818, "res": {"Yes": 0.9487311108338818, "No": 0.05126321707839654}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.99826872518821, "res": {"Yes": 0.99826872518821, "No": 0.0017300369713123835}, "ground_truth": 1}, {"key": "27514800", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994240187409277, "res": {"Yes": 0.9994240187409277, "No": 0.000575667684725838}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9934784114698891, "res": {"Yes": 0.9934784114698891, "No": 0.00652130023747546}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9782297708713835, "res": {"Yes": 0.9782297708713835, "No": 0.021769286037033493}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995678744931329, "res": {"Yes": 0.9995678744931329, "No": 0.0004319697479784018}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999343657340227, "res": {"Yes": 0.9999343657340227, "No": 6.527391927551617e-05}, "ground_truth": 1}, {"key": "25725840", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998823976956932, "res": {"Yes": 0.9998823976956932, "No": 0.00011740870559970918}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999906712677533, "res": {"Yes": 0.999906712677533, "No": 9.301488721885291e-05}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9997284495365032, "res": {"Yes": 0.9997284495365032, "No": 0.0002713497442404969}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6170062040135451, "res": {"Yes": 0.6170062040135451, "No": 0.3829880466805048}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8321636856093306, "res": {"Yes": 0.8321636856093306, "No": 0.16782736788603195}, "ground_truth": 1}, {"key": "38327225", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9985187313629711, "res": {"Yes": 0.9985187313629711, "No": 0.0014808330173288315}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984128449648547, "res": {"Yes": 0.9984128449648547, "No": 0.0015859965992540425}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7396829208114134, "res": {"Yes": 0.7396829208114134, "No": 0.2603136314822317}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9626557670674335, "res": {"Yes": 0.9626557670674335, "No": 0.03733945636598948}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9954048327361495, "res": {"Yes": 0.9954048327361495, "No": 0.004594821364459181}, "ground_truth": 1}, {"key": "11991724", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9868696679013748, "res": {"Yes": 0.9868696679013748, "No": 0.013129159584360891}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9910292306223657, "res": {"Yes": 0.9910292306223657, "No": 0.008969704917969248}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.12559261807041242, "res": {"No": 0.8744068484323791, "Yes": 0.12559261807041242}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997407205887178, "res": {"Yes": 0.9997407205887178, "No": 0.0002588183742455874}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9953805068323902, "res": {"Yes": 0.9953805068323902, "No": 0.004618995600560112}, "ground_truth": 1}, {"key": "32217545", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996610191669898, "res": {"Yes": 0.9996610191669898, "No": 0.000338708399234346}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9861831994293663, "res": {"Yes": 0.9861831994293663, "No": 0.013815971513340655}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9299355651686761, "res": {"Yes": 0.9299355651686761, "No": 0.0700641029187033}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.994693799878926, "res": {"Yes": 0.994693799878926, "No": 0.0053053899685229075}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9087068573312691, "res": {"Yes": 0.9087068573312691, "No": 0.09129244901537492}, "ground_truth": 1}, {"key": "12731847", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989942518040874, "res": {"Yes": 0.9989942518040874, "No": 0.0010055999001320954}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.035497191439881816, "res": {"No": 0.9645021090130685, "Yes": 0.035497191439881816}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.17382921235175194, "res": {"No": 0.8261668733650154, "Yes": 0.17382921235175194}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.35075689581263364, "res": {"No": 0.6492413834963794, "Yes": 0.35075689581263364}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9882994095897553, "res": {"Yes": 0.9882994095897553, "No": 0.01169833798304579}, "ground_truth": 1}, {"key": "36827234", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9867423344023868, "res": {"Yes": 0.9867423344023868, "No": 0.013257511254999035}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7766325881279588, "res": {"Yes": 0.7766325881279588, "No": 0.22335769033734143}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9445541592210521, "res": {"Yes": 0.9445541592210521, "No": 0.05544129864734088}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.009593140184936977, "res": {"No": 0.9904053373312897, "Yes": 0.009593140184936977}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.14074159915941634, "res": {"No": 0.8592541529819837, "Yes": 0.14074159915941634}, "ground_truth": 1}, {"key": "29111539", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.05189028983772259, "res": {"No": 0.9481093967208675, "Yes": 0.05189028983772259}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5063292143560025, "res": {"Yes": 0.5063292143560025, "No": 0.4936651626554262}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9936998970972224, "res": {"Yes": 0.9936998970972224, "No": 0.006299850978945804}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989149030439262, "res": {"Yes": 0.9989149030439262, "No": 0.0010844218404043756}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988361703756252, "res": {"Yes": 0.9988361703756252, "No": 0.001163589564117778}, "ground_truth": 1}, {"key": "37763052", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.001044444932244396, "res": {"No": 0.9989546379719678, "Yes": 0.001044444932244396}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998315160150211, "res": {"Yes": 0.9998315160150211, "No": 0.00016784275483361366}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.2546730788679134, "res": {"No": 0.7453260688844269, "Yes": 0.2546730788679134}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998823976956932, "res": {"Yes": 0.9998823976956932, "No": 0.0001173214446703662}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9887082636672907, "res": {"Yes": 0.9887082636672907, "No": 0.01129052952268162}, "ground_truth": 1}, {"key": "30682335", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998740617908821, "res": {"Yes": 0.9998740617908821, "No": 0.0001250027276125056}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9732843334510006, "res": {"Yes": 0.9732843334510006, "No": 0.026711729578183845}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.010542000005788846, "res": {"No": 0.9894575641636324, "Yes": 0.010542000005788846}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997820633916336, "res": {"Yes": 0.9997820633916336, "No": 0.00021778134567687353}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995142721639788, "res": {"Yes": 0.9995142721639788, "No": 0.0004855263489130444}, "ground_truth": 1}, {"key": "12261276", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999648749133035, "res": {"Yes": 0.999648749133035, "No": 0.00035105909038227667}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999348425128413, "res": {"Yes": 0.9999348425128413, "No": 6.503438031361007e-05}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9172642640333604, "res": {"Yes": 0.9172642640333604, "No": 0.08273458219247616}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9930819380317044, "res": {"Yes": 0.9930819380317044, "No": 0.006917789477859088}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9754751610806954, "res": {"Yes": 0.9754751610806954, "No": 0.024520891757469965}, "ground_truth": 1}, {"key": "36912979", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9935062968132833, "res": {"Yes": 0.9935062968132833, "No": 0.006492144963627474}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9620419271020397, "res": {"Yes": 0.9620419271020397, "No": 0.037956823079873594}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9075092682024688, "res": {"Yes": 0.9075092682024688, "No": 0.09248854314746682}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7447909827753454, "res": {"Yes": 0.7447909827753454, "No": 0.2552057746062676}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9644115079405469, "res": {"Yes": 0.9644115079405469, "No": 0.03558360432071736}, "ground_truth": 1}, {"key": "30205259", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9954187686008998, "res": {"Yes": 0.9954187686008998, "No": 0.004580376861824723}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.56534619554701, "res": {"Yes": 0.56534619554701, "No": 0.4346515297347046}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9995941965005223, "res": {"Yes": 0.9995941965005223, "No": 0.0004055811017870474}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.00014740288585626208, "res": {"No": 0.9998524888808352, "Yes": 0.00014740288585626208}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998910985741908, "res": {"Yes": 0.9998910985741908, "No": 0.00010875749182755397}, "ground_truth": 1}, {"key": "39458032", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999608011247674, "res": {"Yes": 0.999608011247674, "No": 0.0003915068288113881}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.994937187755612, "res": {"Yes": 0.994937187755612, "No": 0.005061807226812024}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.35726302634848733, "res": {"No": 0.6427306874755726, "Yes": 0.35726302634848733}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9928933942012707, "res": {"Yes": 0.9928933942012707, "No": 0.007105795217860523}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9986740958886192, "res": {"Yes": 0.9986740958886192, "No": 0.0013253804880158943}, "ground_truth": 1}, {"key": "35116452", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9519690740119453, "res": {"Yes": 0.9519690740119453, "No": 0.048028216357678045}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9909980870271261, "res": {"Yes": 0.9909980870271261, "No": 0.009001401423912432}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9913387724276063, "res": {"Yes": 0.9913387724276063, "No": 0.008660697646591062}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8864075814019757, "res": {"Yes": 0.8864075814019757, "No": 0.11358445748150649}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999220815192263, "res": {"Yes": 0.999220815192263, "No": 0.0007783439783048317}, "ground_truth": 1}, {"key": "40107476", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988154717081366, "res": {"Yes": 0.9988154717081366, "No": 0.001184023138570155}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7326095448419542, "res": {"Yes": 0.7326095448419542, "No": 0.26738706198065226}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0817366324505231, "res": {"No": 0.9182156803886414, "Yes": 0.0817366324505231}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.49809985998555384, "res": {"No": 0.5018916094671703, "Yes": 0.49809985998555384}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.07229720564580083, "res": {"No": 0.9276953469680338, "Yes": 0.07229720564580083}, "ground_truth": 1}, {"key": "39501049", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7165282318842056, "res": {"Yes": 0.7165282318842056, "No": 0.2834711853378089}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7849764041964196, "res": {"Yes": 0.7849764041964196, "No": 0.21501112672161815}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0053048472548894035, "res": {"No": 0.9946941559793702, "Yes": 0.0053048472548894035}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.4343258153165994, "res": {"No": 0.5656730035354895, "Yes": 0.4343258153165994}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.936690482021455, "res": {"Yes": 0.936690482021455, "No": 0.0633073717035745}, "ground_truth": 1}, {"key": "39642178", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.037150765588340934, "res": {"No": 0.9628353248877111, "Yes": 0.037150765588340934}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8470131830901727, "res": {"Yes": 0.8470131830901727, "No": 0.15297978354697916}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9988745852547103, "res": {"Yes": 0.9988745852547103, "No": 0.0011251303312903324}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999932502087799, "res": {"Yes": 0.9999932502087799, "No": 6.571371469448469e-06}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999765619466755, "res": {"Yes": 0.9999765619466755, "No": 2.3179321300757043e-05}, "ground_truth": 1}, {"key": "38024796", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999981375378344, "res": {"Yes": 0.9999981375378344, "No": 1.794391662771165e-06}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999963211539712, "res": {"Yes": 0.999963211539712, "No": 3.6684215162106735e-05}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9936031459442044, "res": {"Yes": 0.9936031459442044, "No": 0.00639575365647482}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9398520835741323, "res": {"Yes": 0.9398520835741323, "No": 0.06014511821728497}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9958469100304851, "res": {"Yes": 0.9958469100304851, "No": 0.004152141723126931}, "ground_truth": 1}, {"key": "36652079", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9621870312832875, "res": {"Yes": 0.9621870312832875, "No": 0.037809212088617816}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6644865910760531, "res": {"Yes": 0.6644865910760531, "No": 0.3354940021759824}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996002734319606, "res": {"Yes": 0.9996002734319606, "No": 0.0003996232219061942}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999975415208221, "res": {"Yes": 0.9999975415208221, "No": 2.429565799283574e-06}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.99999861435166, "res": {"Yes": 0.99999861435166, "No": 1.295898864150683e-06}, "ground_truth": 1}, {"key": "32193402", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999973031140366, "res": {"Yes": 0.9999973031140366, "No": 2.6124554328892585e-06}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999971839107652, "res": {"Yes": 0.9999971839107652, "No": 2.7262296061738784e-06}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9876886159026247, "res": {"Yes": 0.9876886159026247, "No": 0.01231013096414954}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994637922108072, "res": {"Yes": 0.9994637922108072, "No": 0.0005350063189588399}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997178470126431, "res": {"Yes": 0.9997178470126431, "No": 0.00028106460613100143}, "ground_truth": 1}, {"key": "32589706", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9688606165571355, "res": {"Yes": 0.9688606165571355, "No": 0.031138863802354092}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9983693561467516, "res": {"Yes": 0.9983693561467516, "No": 0.001630015752662567}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.913654616713925, "res": {"Yes": 0.913654616713925, "No": 0.08634478240616869}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9721065997600895, "res": {"Yes": 0.9721065997600895, "No": 0.02789266577948104}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9921819531526166, "res": {"Yes": 0.9921819531526166, "No": 0.007817482556302293}, "ground_truth": 1}, {"key": "38590589", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993650852437295, "res": {"Yes": 0.9993650852437295, "No": 0.0006347472308326695}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9972850047840479, "res": {"Yes": 0.9972850047840479, "No": 0.0027148189850283878}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4855774391775142, "res": {"No": 0.514339461799169, "Yes": 0.4855774391775142}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9963195419499511, "res": {"Yes": 0.9963195419499511, "No": 0.0036666068816109485}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.992254236637685, "res": {"Yes": 0.992254236637685, "No": 0.007744851337029339}, "ground_truth": 1}, {"key": "37045414", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9691078625743617, "res": {"Yes": 0.9691078625743617, "No": 0.030891105018439637}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7067020150062142, "res": {"Yes": 0.7067020150062142, "No": 0.2932875652231285}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0009149513166053764, "res": {"No": 0.9990844371436729, "Yes": 0.0009149513166053764}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 7.172673548604212e-05, "res": {"No": 0.9999281675700725, "Yes": 7.172673548604212e-05}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00023118368274942404, "res": {"No": 0.9997685964079422, "Yes": 0.00023118368274942404}, "ground_truth": 1}, {"key": "33310095", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0001879040683693211, "res": {"No": 0.9998118545815696, "Yes": 0.0001879040683693211}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0018046630148518127, "res": {"No": 0.998195077635021, "Yes": 0.0018046630148518127}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.023338731555036747, "res": {"No": 0.976659737865465, "Yes": 0.023338731555036747}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9910601343686974, "res": {"Yes": 0.9910601343686974, "No": 0.008939478721980684}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996759110281803, "res": {"Yes": 0.9996759110281803, "No": 0.0003239481778085033}, "ground_truth": 1}, {"key": "37934604", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990376706761422, "res": {"Yes": 0.9990376706761422, "No": 0.0009621391222800285}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.996673128142908, "res": {"Yes": 0.996673128142908, "No": 0.003326673577247911}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9800778830257835, "res": {"Yes": 0.9800778830257835, "No": 0.019913607240374706}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9976113896804891, "res": {"Yes": 0.9976113896804891, "No": 0.0023880806762456084}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9931224957303748, "res": {"Yes": 0.9931224957303748, "No": 0.006876867747239502}, "ground_truth": 1}, {"key": "39012181", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7460576521962856, "res": {"Yes": 0.7460576521962856, "No": 0.25393016264141366}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9902928673452543, "res": {"Yes": 0.9902928673452543, "No": 0.009700382124212713}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.003053438336109506, "res": {"No": 0.9969465064233758, "Yes": 0.003053438336109506}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9952697201800955, "res": {"Yes": 0.9952697201800955, "No": 0.0047297189350933525}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8992730718194273, "res": {"Yes": 0.8992730718194273, "No": 0.10072566961242929}, "ground_truth": 1}, {"key": "40221674", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9846103783866005, "res": {"Yes": 0.9846103783866005, "No": 0.015389426442799444}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8497209054030198, "res": {"Yes": 0.8497209054030198, "No": 0.15027673268929134}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5701455841362312, "res": {"Yes": 0.5701455841362312, "No": 0.4298516198333219}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.996445106548478, "res": {"Yes": 0.996445106548478, "No": 0.003553799379695989}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9822276467427722, "res": {"Yes": 0.9822276467427722, "No": 0.01777076655774611}, "ground_truth": 1}, {"key": "36884862", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9569823239226711, "res": {"Yes": 0.9569823239226711, "No": 0.04301115406782404}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.715942745216693, "res": {"Yes": 0.715942745216693, "No": 0.28405542540084766}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.03224297141864406, "res": {"No": 0.9677562047726094, "Yes": 0.03224297141864406}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9888152595549338, "res": {"Yes": 0.9888152595549338, "No": 0.011181805841660909}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9757440800660269, "res": {"Yes": 0.9757440800660269, "No": 0.02425447603180623}, "ground_truth": 1}, {"key": "39054429", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9886272838673222, "res": {"Yes": 0.9886272838673222, "No": 0.011371773531074212}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.991317334958446, "res": {"Yes": 0.991317334958446, "No": 0.008681912851430702}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.09002102723464482, "res": {"No": 0.9099782917277618, "Yes": 0.09002102723464482}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9962559973212224, "res": {"Yes": 0.9962559973212224, "No": 0.003743710676232827}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991820114351982, "res": {"Yes": 0.9991820114351982, "No": 0.000817447808536262}, "ground_truth": 1}, {"key": "36753964", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991119226143471, "res": {"Yes": 0.9991119226143471, "No": 0.0008877157212085634}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998198360914665, "res": {"Yes": 0.9998198360914665, "No": 0.00017968881657021323}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.2779437010524749, "res": {"No": 0.7220264835101882, "Yes": 0.2779437010524749}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7469673298098812, "res": {"Yes": 0.7469673298098812, "No": 0.25302843633237143}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5126233059155388, "res": {"Yes": 0.5126233059155388, "No": 0.48736609655856145}, "ground_truth": 1}, {"key": "37612459", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9105488130444964, "res": {"Yes": 0.9105488130444964, "No": 0.08944299356891561}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.4181896881463514, "res": {"No": 0.5818072102461366, "Yes": 0.4181896881463514}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.2298600347184074, "res": {"No": 0.7701172061028942, "Yes": 0.2298600347184074}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.1958709607673264, "res": {"No": 0.8041016238237215, "Yes": 0.1958709607673264}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.030419592135967424, "res": {"No": 0.9695583504341703, "Yes": 0.030419592135967424}, "ground_truth": 1}, {"key": "36805789", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.007975162135880181, "res": {"No": 0.9919508185508872, "Yes": 0.007975162135880181}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0521927334355054, "res": {"No": 0.9477279485646313, "Yes": 0.0521927334355054}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 2.8712585849040635e-05, "res": {"No": 0.9999707211216348, "Yes": 2.8712585849040635e-05}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9950434081437668, "res": {"Yes": 0.9950434081437668, "No": 0.004956577978706636}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9567964366784598, "res": {"Yes": 0.9567964366784598, "No": 0.04319334269023858}, "ground_truth": 1}, {"key": "12757394", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9961087212234047, "res": {"Yes": 0.9961087212234047, "No": 0.0038896231603125866}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9832791357714107, "res": {"Yes": 0.9832791357714107, "No": 0.016712983609156944}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9917593072085211, "res": {"Yes": 0.9917593072085211, "No": 0.008240238428350087}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.04718599247655224, "res": {"No": 0.9528127932753164, "Yes": 0.04718599247655224}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.35585974516997176, "res": {"No": 0.6441354170887099, "Yes": 0.35585974516997176}, "ground_truth": 1}, {"key": "32192542", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.15894619980927382, "res": {"No": 0.8410458937889058, "Yes": 0.15894619980927382}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9887394989377842, "res": {"Yes": 0.9887394989377842, "No": 0.011258843165036666}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9995747780324976, "res": {"Yes": 0.9995747780324976, "No": 0.00042512938503263317}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9801512838069013, "res": {"Yes": 0.9801512838069013, "No": 0.019848431353185855}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999478349506435, "res": {"Yes": 0.9999478349506435, "No": 5.1907565899846e-05}, "ground_truth": 1}, {"key": "34856060", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999892767243843, "res": {"Yes": 0.999892767243843, "No": 0.00010705112862645428}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9963434487249142, "res": {"Yes": 0.9963434487249142, "No": 0.0036564154380284023}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.08035628255487196, "res": {"No": 0.9196430034262818, "Yes": 0.08035628255487196}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.10423876436362019, "res": {"No": 0.8957541498375916, "Yes": 0.10423876436362019}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.13739877703468292, "res": {"No": 0.8625992709035251, "Yes": 0.13739877703468292}, "ground_truth": 1}, {"key": "36083416", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9825998420446939, "res": {"Yes": 0.9825998420446939, "No": 0.01739970546854559}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.024988401544164394, "res": {"No": 0.9750099567355216, "Yes": 0.024988401544164394}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.937064142416198, "res": {"Yes": 0.937064142416198, "No": 0.0629347565199766}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9610172626094264, "res": {"Yes": 0.9610172626094264, "No": 0.03898189388551487}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9759553486008057, "res": {"Yes": 0.9759553486008057, "No": 0.02404322083807765}, "ground_truth": 1}, {"key": "33839050", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9987656479399816, "res": {"Yes": 0.9987656479399816, "No": 0.001233544433930958}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6820152913880009, "res": {"Yes": 0.6820152913880009, "No": 0.3179830816422878}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.008099353785939017, "res": {"No": 0.9919004971703491, "Yes": 0.008099353785939017}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9981961412124428, "res": {"Yes": 0.9981961412124428, "No": 0.0018032133701983125}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988598389780582, "res": {"Yes": 0.9988598389780582, "No": 0.0011397275914481965}, "ground_truth": 1}, {"key": "18464690", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9973490302427211, "res": {"Yes": 0.9973490302427211, "No": 0.002650594034878317}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9979295596247437, "res": {"Yes": 0.9979295596247437, "No": 0.0020700214695403957}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7655403918191124, "res": {"Yes": 0.7655403918191124, "No": 0.23445929224568235}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9988353369470724, "res": {"Yes": 0.9988353369470724, "No": 0.0011644097182310178}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9965799417680298, "res": {"Yes": 0.9965799417680298, "No": 0.0034197336878133496}, "ground_truth": 1}, {"key": "39212665", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9756790566957109, "res": {"Yes": 0.9756790566957109, "No": 0.0243204018155424}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9877069860940249, "res": {"Yes": 0.9877069860940249, "No": 0.012289856888750776}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9995648957353269, "res": {"Yes": 0.9995648957353269, "No": 0.00043464267553081304}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989755740828662, "res": {"Yes": 0.9989755740828662, "No": 0.0010204505842129911}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9658201366982551, "res": {"Yes": 0.9658201366982551, "No": 0.034176927400366014}, "ground_truth": 1}, {"key": "40094011", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9968543347052868, "res": {"Yes": 0.9968543347052868, "No": 0.0031450892841368414}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984313746807904, "res": {"Yes": 0.9984313746807904, "No": 0.0015673092240644964}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9729826873666605, "res": {"Yes": 0.9729826873666605, "No": 0.027016780662882812}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7830564351859164, "res": {"Yes": 0.7830564351859164, "No": 0.21694153189903068}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7915254785268074, "res": {"Yes": 0.7915254785268074, "No": 0.20847305056128423}, "ground_truth": 1}, {"key": "36036272", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978681962282223, "res": {"Yes": 0.9978681962282223, "No": 0.002131686134456004}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9758529401477014, "res": {"Yes": 0.9758529401477014, "No": 0.024145844115664287}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9950652500838172, "res": {"Yes": 0.9950652500838172, "No": 0.004934425629514437}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989948472048389, "res": {"Yes": 0.9989948472048389, "No": 0.0010042161420057325}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998758496172967, "res": {"Yes": 0.9998758496172967, "No": 0.0001239271084850294}, "ground_truth": 1}, {"key": "30681904", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995230889582407, "res": {"Yes": 0.9995230889582407, "No": 0.00047629411780632014}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990871652873251, "res": {"Yes": 0.9990871652873251, "No": 0.0009127054930480345}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0036908850453525556, "res": {"No": 0.9963081768981253, "Yes": 0.0036908850453525556}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998341380566133, "res": {"Yes": 0.9998341380566133, "No": 0.0001657852967226063}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999356768848203, "res": {"Yes": 0.9999356768848203, "No": 6.40782221381466e-05}, "ground_truth": 1}, {"key": "27834240", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993380581802147, "res": {"Yes": 0.9993380581802147, "No": 0.0006618502076915369}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995777568497407, "res": {"Yes": 0.9995777568497407, "No": 0.00042204116554541863}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9988467526014888, "res": {"Yes": 0.9988467526014888, "No": 0.0011525707461865129}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997831359983979, "res": {"Yes": 0.9997831359983979, "No": 0.00021651927163563107}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987862156328665, "res": {"Yes": 0.9987862156328665, "No": 0.0012132130809747155}, "ground_truth": 1}, {"key": "35025075", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999006338731407, "res": {"Yes": 0.9999006338731407, "No": 9.909069659459212e-05}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998819209378813, "res": {"Yes": 0.9998819209378813, "No": 0.00011751612497100135}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6042225250137274, "res": {"Yes": 0.6042225250137274, "No": 0.39577538826428954}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.3820664242579026, "res": {"No": 0.617932840351578, "Yes": 0.3820664242579026}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.993766058149502, "res": {"Yes": 0.993766058149502, "No": 0.006233763721146798}, "ground_truth": 1}, {"key": "33316985", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9754869595241196, "res": {"Yes": 0.9754869595241196, "No": 0.02451239919156251}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0425387863175091, "res": {"No": 0.9574608322790481, "Yes": 0.0425387863175091}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.002699402032349582, "res": {"No": 0.9973003002614593, "Yes": 0.002699402032349582}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9862997317483218, "res": {"Yes": 0.9862997317483218, "No": 0.013699673206126051}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9451094481940894, "res": {"Yes": 0.9451094481940894, "No": 0.054888287262234325}, "ground_truth": 1}, {"key": "17037056", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9749730221079237, "res": {"Yes": 0.9749730221079237, "No": 0.02502456341217425}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5420987492227023, "res": {"Yes": 0.5420987492227023, "No": 0.45789340139675533}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6878283936468302, "res": {"Yes": 0.6878283936468302, "No": 0.31216945924914286}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989972289112933, "res": {"Yes": 0.9989972289112933, "No": 0.0010026036626397121}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9983312134752799, "res": {"Yes": 0.9983312134752799, "No": 0.0016685359728687748}, "ground_truth": 1}, {"key": "34050457", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999026480078292, "res": {"Yes": 0.999026480078292, "No": 0.0009730870638272492}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9923243136939309, "res": {"Yes": 0.9923243136939309, "No": 0.007673260163511147}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9658778568001326, "res": {"Yes": 0.9658778568001326, "No": 0.03412152029682663}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9970514965995317, "res": {"Yes": 0.9970514965995317, "No": 0.0029482986612507115}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.978930943238822, "res": {"Yes": 0.978930943238822, "No": 0.021068941283668298}, "ground_truth": 1}, {"key": "34713745", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999030177130861, "res": {"Yes": 0.9999030177130861, "No": 9.672419306322385e-05}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9991803440016489, "res": {"Yes": 0.9991803440016489, "No": 0.0008185290254684349}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0001849235613797725, "res": {"No": 0.9998147149373978, "Yes": 0.0001849235613797725}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9527201662709923, "res": {"Yes": 0.9527201662709923, "No": 0.04727688935654156}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3994605488364912, "res": {"No": 0.6005174372491558, "Yes": 0.3994605488364912}, "ground_truth": 1}, {"key": "40856210", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6655825944382353, "res": {"Yes": 0.6655825944382353, "No": 0.3344079246287175}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9770789496154656, "res": {"Yes": 0.9770789496154656, "No": 0.0229193396186617}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0011099110522242851, "res": {"No": 0.9988898115157246, "Yes": 0.0011099110522242851}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9882931240254983, "res": {"Yes": 0.9882931240254983, "No": 0.011705988857217343}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8051163321635642, "res": {"Yes": 0.8051163321635642, "No": 0.19487941428136285}, "ground_truth": 1}, {"key": "40848302", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8772690492684504, "res": {"Yes": 0.8772690492684504, "No": 0.12272805577248387}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5754103733268465, "res": {"Yes": 0.5754103733268465, "No": 0.42458702005453325}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0020166551628412626, "res": {"No": 0.9979794275105723, "Yes": 0.0020166551628412626}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9934031170048984, "res": {"Yes": 0.9934031170048984, "No": 0.006595807889580127}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995457161181841, "res": {"Yes": 0.9995457161181841, "No": 0.0004527540572018188}, "ground_truth": 1}, {"key": "40636168", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986563838615248, "res": {"Yes": 0.9986563838615248, "No": 0.0013426070439151677}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.993840236113271, "res": {"Yes": 0.993840236113271, "No": 0.006158752735139058}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0014512205761351268, "res": {"No": 0.9985482029783991, "Yes": 0.0014512205761351268}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9908298773972215, "res": {"Yes": 0.9908298773972215, "No": 0.009169437829417964}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999944378229948, "res": {"Yes": 0.999944378229948, "No": 5.531801134634317e-05}, "ground_truth": 1}, {"key": "34423311", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997553789246155, "res": {"Yes": 0.9997553789246155, "No": 0.00024436440100787774}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9978973958754451, "res": {"Yes": 0.9978973958754451, "No": 0.002102367895911701}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.046109116207195995, "res": {"No": 0.9538896329099025, "Yes": 0.046109116207195995}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9980146906388544, "res": {"Yes": 0.9980146906388544, "No": 0.0019843993601052815}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6075890683174318, "res": {"Yes": 0.6075890683174318, "No": 0.392402727696041}, "ground_truth": 1}, {"key": "34833945", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.004878588708602783, "res": {"No": 0.9951135308259432, "Yes": 0.004878588708602783}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.021043353856290033, "res": {"No": 0.9789550457942888, "Yes": 0.021043353856290033}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0010109450424659729, "res": {"No": 0.9989858078408604, "Yes": 0.0010109450424659729}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.04992262361059578, "res": {"No": 0.9500759853568397, "Yes": 0.04992262361059578}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9938629585423397, "res": {"Yes": 0.9938629585423397, "No": 0.006133619171943639}, "ground_truth": 1}, {"key": "21272328", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9923906508068796, "res": {"Yes": 0.9923906508068796, "No": 0.007607520359166613}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6673331917085856, "res": {"Yes": 0.6673331917085856, "No": 0.3326554531076998}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7433758184231556, "res": {"Yes": 0.7433758184231556, "No": 0.2566089880344443}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9812602226034143, "res": {"Yes": 0.9812602226034143, "No": 0.0187378881617027}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9841896684641926, "res": {"Yes": 0.9841896684641926, "No": 0.015807828294067034}, "ground_truth": 1}, {"key": "38648957", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995339277054509, "res": {"Yes": 0.9995339277054509, "No": 0.0004652158809522194}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9723184322277237, "res": {"Yes": 0.9723184322277237, "No": 0.027676884742397417}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9478900893052961, "res": {"Yes": 0.9478900893052961, "No": 0.05210856230811242}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.824990753985963, "res": {"Yes": 0.824990753985963, "No": 0.17500526846456235}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9945493344782607, "res": {"Yes": 0.9945493344782607, "No": 0.005450319762553254}, "ground_truth": 1}, {"key": "24942981", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9947038277360776, "res": {"Yes": 0.9947038277360776, "No": 0.005295822376978713}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996813889672788, "res": {"Yes": 0.9996813889672788, "No": 0.00031723840515895095}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 3.714206485695121e-06, "res": {"No": 0.9999959918780326, "Yes": 3.714206485695121e-06}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5729179306570724, "res": {"Yes": 0.5729179306570724, "No": 0.42707565647842044}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8133084695952915, "res": {"Yes": 0.8133084695952915, "No": 0.18668437917223238}, "ground_truth": 1}, {"key": "35882366", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.1615390451347107, "res": {"No": 0.8384536135503894, "Yes": 0.1615390451347107}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.049567718194214024, "res": {"No": 0.9504231381248702, "Yes": 0.049567718194214024}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9938384658866191, "res": {"Yes": 0.9938384658866191, "No": 0.006161114453650221}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998426001486566, "res": {"Yes": 0.9998426001486566, "No": 0.0001572850175582425}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996767451980956, "res": {"Yes": 0.9996767451980956, "No": 0.00032305983636325805}, "ground_truth": 1}, {"key": "40559523", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992891321163796, "res": {"Yes": 0.9992891321163796, "No": 0.0007107697644079193}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999757275415809, "res": {"Yes": 0.9999757275415809, "No": 2.412605936984248e-05}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0016576489096999237, "res": {"No": 0.9983381048795986, "Yes": 0.0016576489096999237}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9530557133679891, "res": {"Yes": 0.9530557133679891, "No": 0.046943759507516405}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995011844998384, "res": {"Yes": 0.9995011844998384, "No": 0.0004986974294136879}, "ground_truth": 1}, {"key": "24632722", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998234115535755, "res": {"Yes": 0.9998234115535755, "No": 0.00017638084653858913}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999250684975053, "res": {"Yes": 0.9999250684975053, "No": 7.462693924921554e-05}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9987810998629715, "res": {"Yes": 0.9987810998629715, "No": 0.0012178393682009399}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998257952254141, "res": {"Yes": 0.9998257952254141, "No": 0.00017376130689187658}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9984988868990482, "res": {"Yes": 0.9984988868990482, "No": 0.0015002552780307864}, "ground_truth": 1}, {"key": "36002759", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991323857550809, "res": {"Yes": 0.9991323857550809, "No": 0.0008671401022049314}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984492055263988, "res": {"Yes": 0.9984492055263988, "No": 0.001549455035303586}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7511678877037564, "res": {"Yes": 0.7511678877037564, "No": 0.24881217112522946}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9960240326718884, "res": {"Yes": 0.9960240326718884, "No": 0.003974985017759707}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7182734735999764, "res": {"Yes": 0.7182734735999764, "No": 0.2817180305319243}, "ground_truth": 1}, {"key": "29508534", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988056041591892, "res": {"Yes": 0.9988056041591892, "No": 0.0011935621975138718}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9764111119476269, "res": {"Yes": 0.9764111119476269, "No": 0.023585772710227625}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9992863924390719, "res": {"Yes": 0.9992863924390719, "No": 0.0007130813847175721}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999932458601023, "res": {"Yes": 0.999932458601023, "No": 6.71313775226472e-05}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999380608083109, "res": {"Yes": 0.9999380608083109, "No": 6.180693394730352e-05}, "ground_truth": 1}, {"key": "15631612", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999768003491161, "res": {"Yes": 0.9999768003491161, "No": 2.2964339540380755e-05}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992196240817924, "res": {"Yes": 0.9992196240817924, "No": 0.000779781738401854}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9977783455355569, "res": {"Yes": 0.9977783455355569, "No": 0.0022216080465868654}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999635045582071, "res": {"Yes": 0.999635045582071, "No": 0.0003647908800279442}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998710820706306, "res": {"Yes": 0.9998710820706306, "No": 0.0001288730173541999}, "ground_truth": 1}, {"key": "40731892", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997401283924773, "res": {"Yes": 0.9997401283924773, "No": 0.0002597915446160725}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997821825756604, "res": {"Yes": 0.9997821825756604, "No": 0.00021771515021000855}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9678167233635472, "res": {"Yes": 0.9678167233635472, "No": 0.032181954589465774}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9893322365223786, "res": {"Yes": 0.9893322365223786, "No": 0.010666780425678828}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980069761149135, "res": {"Yes": 0.9980069761149135, "No": 0.0019928888689371865}, "ground_truth": 1}, {"key": "35971910", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7591045986109206, "res": {"Yes": 0.7591045986109206, "No": 0.24089153717779294}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9606628798133391, "res": {"Yes": 0.9606628798133391, "No": 0.03933506573674356}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.11156428579614257, "res": {"No": 0.8884341125158248, "Yes": 0.11156428579614257}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9953617251748029, "res": {"Yes": 0.9953617251748029, "No": 0.004637552640786568}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999752995450648, "res": {"Yes": 0.999752995450648, "No": 0.00024576346720775845}, "ground_truth": 1}, {"key": "34428424", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.986272141385534, "res": {"Yes": 0.986272141385534, "No": 0.013726331274085445}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.000523002664116146, "res": {"No": 0.9994618860352804, "Yes": 0.000523002664116146}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5468831057703687, "res": {"Yes": 0.5468831057703687, "No": 0.453114013380425}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.47063633298786867, "res": {"No": 0.5293585968158381, "Yes": 0.47063633298786867}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9334290436282088, "res": {"Yes": 0.9334290436282088, "No": 0.06656957084919256}, "ground_truth": 1}, {"key": "36971005", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9734054019788705, "res": {"Yes": 0.9734054019788705, "No": 0.026593445588630537}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0328454845539595, "res": {"No": 0.9671522502067201, "Yes": 0.0328454845539595}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.999856064459714, "res": {"Yes": 0.999856064459714, "No": 0.00014358620089692975}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999402063417121, "res": {"Yes": 0.9999402063417121, "No": 5.9493231987008665e-05}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998913369602558, "res": {"Yes": 0.9998913369602558, "No": 0.00010839376381451499}, "ground_truth": 1}, {"key": "34649067", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999044480253807, "res": {"Yes": 0.9999044480253807, "No": 9.527901222947375e-05}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999387759842665, "res": {"Yes": 0.9999387759842665, "No": 6.100053032355402e-05}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.18702069496290513, "res": {"No": 0.812969943485714, "Yes": 0.18702069496290513}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9240320331778278, "res": {"Yes": 0.9240320331778278, "No": 0.07593196021573072}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990038902470245, "res": {"Yes": 0.9990038902470245, "No": 0.0009959355612627608}, "ground_truth": 1}, {"key": "37355154", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9700169358480124, "res": {"Yes": 0.9700169358480124, "No": 0.02998158257527319}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9300563995464939, "res": {"Yes": 0.9300563995464939, "No": 0.06994181478098697}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.03398698913852721, "res": {"No": 0.9660118913106415, "Yes": 0.03398698913852721}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994253291465832, "res": {"Yes": 0.9994253291465832, "No": 0.0005744353497959672}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994462862160901, "res": {"Yes": 0.9994462862160901, "No": 0.0005534617023439279}, "ground_truth": 1}, {"key": "38674697", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994355711499273, "res": {"Yes": 0.9994355711499273, "No": 0.0005638552434267786}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9969258940695811, "res": {"Yes": 0.9969258940695811, "No": 0.0030734382282412535}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.29437350287480407, "res": {"No": 0.7056186663936124, "Yes": 0.29437350287480407}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9953229837629475, "res": {"Yes": 0.9953229837629475, "No": 0.004671338647921186}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9971996527079431, "res": {"Yes": 0.9971996527079431, "No": 0.0027993262941056786}, "ground_truth": 1}, {"key": "40525767", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.997170837245358, "res": {"Yes": 0.997170837245358, "No": 0.002826413176479532}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997654978299332, "res": {"Yes": 0.9997654978299332, "No": 0.00023285933480268948}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5658629318404588, "res": {"Yes": 0.5658629318404588, "No": 0.4341336686589051}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9424424429620547, "res": {"Yes": 0.9424424429620547, "No": 0.05755518801033982}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9794231040383211, "res": {"Yes": 0.9794231040383211, "No": 0.02057638541116202}, "ground_truth": 1}, {"key": "27165110", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7292052255954509, "res": {"Yes": 0.7292052255954509, "No": 0.27079194055517325}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7026324391939176, "res": {"Yes": 0.7026324391939176, "No": 0.2973657845983039}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9989166891053695, "res": {"Yes": 0.9989166891053695, "No": 0.0010815485740364947}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9979568688397711, "res": {"Yes": 0.9979568688397711, "No": 0.0020410661195811607}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9844995588485598, "res": {"Yes": 0.9844995588485598, "No": 0.015498681859433903}, "ground_truth": 1}, {"key": "35497491", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9910151809005548, "res": {"Yes": 0.9910151809005548, "No": 0.008983205504061734}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985050653297257, "res": {"Yes": 0.9985050653297257, "No": 0.00149294544741132}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9691451419635199, "res": {"Yes": 0.9691451419635199, "No": 0.030853548837363375}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.15342756693019105, "res": {"No": 0.846571259175838, "Yes": 0.15342756693019105}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.83013368906451, "res": {"Yes": 0.83013368906451, "No": 0.16986574317074787}, "ground_truth": 1}, {"key": "40690716", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.211170819910081, "res": {"No": 0.7888262483039123, "Yes": 0.211170819910081}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.04200916374889687, "res": {"No": 0.9579750597634512, "Yes": 0.04200916374889687}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0008881241643750458, "res": {"No": 0.9991064478556914, "Yes": 0.0008881241643750458}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9446478749770837, "res": {"Yes": 0.9446478749770837, "No": 0.05534748826444356}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9879986348164012, "res": {"Yes": 0.9879986348164012, "No": 0.012000643567586495}, "ground_truth": 1}, {"key": "34835193", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9886928784977044, "res": {"Yes": 0.9886928784977044, "No": 0.011306211658543702}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.988911654953534, "res": {"Yes": 0.988911654953534, "No": 0.011086645534230331}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992259295871956, "res": {"Yes": 0.9992259295871956, "No": 0.0007736798503359248}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.997879233010868, "res": {"Yes": 0.997879233010868, "No": 0.002120427626554832}, "ground_truth": 1}, {"key": "39471712", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.996774503327361, "res": {"Yes": 0.996774503327361, "No": 0.003225168764584024}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9979783605713367, "res": {"Yes": 0.9979783605713367, "No": 0.0020213816828105443}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8072450268255632, "res": {"Yes": 0.8072450268255632, "No": 0.19274363290549823}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.37910620078463964, "res": {"No": 0.6208841427960424, "Yes": 0.37910620078463964}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.009771596674756243, "res": {"No": 0.9902193334029146, "Yes": 0.009771596674756243}, "ground_truth": 1}, {"key": "39115192", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.18372347592793062, "res": {"No": 0.8162735151882745, "Yes": 0.18372347592793062}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9840717932219161, "res": {"Yes": 0.9840717932219161, "No": 0.01592552676828031}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9962624996064593, "res": {"Yes": 0.9962624996064593, "No": 0.0037370277603283484}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9932276121861776, "res": {"Yes": 0.9932276121861776, "No": 0.006772107098071432}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.994450649249649, "res": {"Yes": 0.994450649249649, "No": 0.0055490474310480415}, "ground_truth": 1}, {"key": "23520673", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978000641138407, "res": {"Yes": 0.9978000641138407, "No": 0.0021997807118889594}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997512078539001, "res": {"Yes": 0.9997512078539001, "No": 0.00024854143149173255}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.699509432734782, "res": {"Yes": 0.699509432734782, "No": 0.30048937000258497}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996438634816706, "res": {"Yes": 0.9996438634816706, "No": 0.00035543008312655295}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992368842810174, "res": {"Yes": 0.9992368842810174, "No": 0.0007627925125735015}, "ground_truth": 1}, {"key": "35764233", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9971971598116472, "res": {"Yes": 0.9971971598116472, "No": 0.0028026855400994193}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996471999885653, "res": {"Yes": 0.9996471999885653, "No": 0.00035218533536724946}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9674296421640386, "res": {"Yes": 0.9674296421640386, "No": 0.03256393146165762}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.08538242462598183, "res": {"No": 0.9146061989586409, "Yes": 0.08538242462598183}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9985041132555998, "res": {"Yes": 0.9985041132555998, "No": 0.001492380176011281}, "ground_truth": 1}, {"key": "35228910", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9912775076019565, "res": {"Yes": 0.9912775076019565, "No": 0.008719497228548867}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.2296919306169857, "res": {"No": 0.7702647053723768, "Yes": 0.2296919306169857}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9945698571160633, "res": {"Yes": 0.9945698571160633, "No": 0.0054297005168061395}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991907025579686, "res": {"Yes": 0.9991907025579686, "No": 0.0008087360185714909}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9540184062088533, "res": {"Yes": 0.9540184062088533, "No": 0.04597955673871034}, "ground_truth": 1}, {"key": "36795599", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998683407378415, "res": {"Yes": 0.9998683407378415, "No": 0.0001312175401791745}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9287272068509151, "res": {"Yes": 0.9287272068509151, "No": 0.0712228916713592}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.931764950628961, "res": {"Yes": 0.931764950628961, "No": 0.06823438925117703}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9956451387282936, "res": {"Yes": 0.9956451387282936, "No": 0.004354793876969332}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9839488667156149, "res": {"Yes": 0.9839488667156149, "No": 0.016050692241895984}, "ground_truth": 1}, {"key": "38641949", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9737674359261047, "res": {"Yes": 0.9737674359261047, "No": 0.0262315865722425}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9980257364271715, "res": {"Yes": 0.9980257364271715, "No": 0.001973943421965277}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9878703011412567, "res": {"Yes": 0.9878703011412567, "No": 0.0121286810073151}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9776000113057546, "res": {"Yes": 0.9776000113057546, "No": 0.02239881328214996}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988660232381235, "res": {"Yes": 0.9988660232381235, "No": 0.0011332836219221597}, "ground_truth": 1}, {"key": "29968443", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7121807908992648, "res": {"Yes": 0.7121807908992648, "No": 0.2878074496638238}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9975298967380918, "res": {"Yes": 0.9975298967380918, "No": 0.0024698385372829597}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9817070440012416, "res": {"Yes": 0.9817070440012416, "No": 0.018291917195711736}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.998886004953684, "res": {"Yes": 0.998886004953684, "No": 0.0011134563196624075}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9960295905014971, "res": {"Yes": 0.9960295905014971, "No": 0.003968508291924887}, "ground_truth": 1}, {"key": "21268042", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9916189673288056, "res": {"Yes": 0.9916189673288056, "No": 0.008380128755399787}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994044916855028, "res": {"Yes": 0.9994044916855028, "No": 0.0005953496964115195}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6123179654506216, "res": {"Yes": 0.6123179654506216, "No": 0.3876793261793746}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9594275734698857, "res": {"Yes": 0.9594275734698857, "No": 0.040570799308430466}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.2559286459786408, "res": {"No": 0.744068216134011, "Yes": 0.2559286459786408}, "ground_truth": 1}, {"key": "26808572", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9740358695152397, "res": {"Yes": 0.9740358695152397, "No": 0.025963218905863943}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9554184184038383, "res": {"Yes": 0.9554184184038383, "No": 0.04457842417052054}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9717505240161388, "res": {"Yes": 0.9717505240161388, "No": 0.02824040288479822}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9840398133764233, "res": {"Yes": 0.9840398133764233, "No": 0.01595413876040994}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5779982430617113, "res": {"Yes": 0.5779982430617113, "No": 0.4219604878571545}, "ground_truth": 1}, {"key": "37829390", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8108874936113881, "res": {"Yes": 0.8108874936113881, "No": 0.18905256138872578}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9873557863607169, "res": {"Yes": 0.9873557863607169, "No": 0.012633617025116797}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9993919865751202, "res": {"Yes": 0.9993919865751202, "No": 0.0006078954791919244}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9816811940317012, "res": {"Yes": 0.9816811940317012, "No": 0.018318386440628734}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993561579552968, "res": {"Yes": 0.9993561579552968, "No": 0.000643449700168199}, "ground_truth": 1}, {"key": "35716045", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9895268949156512, "res": {"Yes": 0.9895268949156512, "No": 0.010471786900890415}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9966889900229586, "res": {"Yes": 0.9966889900229586, "No": 0.0033106242904188663}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.970695672885267, "res": {"Yes": 0.970695672885267, "No": 0.029303526846948695}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6994928965272509, "res": {"Yes": 0.6994928965272509, "No": 0.3005051761591454}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9080967619812114, "res": {"Yes": 0.9080967619812114, "No": 0.09190215504539097}, "ground_truth": 1}, {"key": "34367070", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6191304842791914, "res": {"Yes": 0.6191304842791914, "No": 0.38086526559784506}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6495955503427207, "res": {"Yes": 0.6495955503427207, "No": 0.3504011282617497}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.14721219936506968, "res": {"No": 0.8527731590289753, "Yes": 0.14721219936506968}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9501047189393574, "res": {"Yes": 0.9501047189393574, "No": 0.049893098120968725}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9836688520885156, "res": {"Yes": 0.9836688520885156, "No": 0.016330304916602822}, "ground_truth": 1}, {"key": "35239748", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0010126283516055624, "res": {"No": 0.9989824772277291, "Yes": 0.0010126283516055624}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0011400536001563738, "res": {"No": 0.9988522259970354, "Yes": 0.0011400536001563738}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.996404385758025, "res": {"Yes": 0.996404385758025, "No": 0.0035951861819947498}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9820949420196837, "res": {"Yes": 0.9820949420196837, "No": 0.01790410970553071}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9960454423389669, "res": {"Yes": 0.9960454423389669, "No": 0.0039536858839178575}, "ground_truth": 1}, {"key": "40421370", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9936538790262353, "res": {"Yes": 0.9936538790262353, "No": 0.0063458685491823656}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9950621768295381, "res": {"Yes": 0.9950621768295381, "No": 0.00493646396818739}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9950342035372934, "res": {"Yes": 0.9950342035372934, "No": 0.004965312712920491}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9970843129957726, "res": {"Yes": 0.9970843129957726, "No": 0.0029149794760810247}, "ground_truth": 1}, {"key": "37288396", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.995112819320023, "res": {"Yes": 0.995112819320023, "No": 0.00488637138014564}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8397946175140196, "res": {"Yes": 0.8397946175140196, "No": 0.16020119258896912}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9282330093978317, "res": {"Yes": 0.9282330093978317, "No": 0.07176136784701576}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5928413462779853, "res": {"Yes": 0.5928413462779853, "No": 0.407148970347044}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.007840152447301529, "res": {"No": 0.9921557832104665, "Yes": 0.007840152447301529}, "ground_truth": 1}, {"key": "38903688", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7202162030743201, "res": {"Yes": 0.7202162030743201, "No": 0.27975087611965305}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.021223971605420524, "res": {"No": 0.9787288902316372, "Yes": 0.021223971605420524}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0041966256217635, "res": {"No": 0.9958031684156443, "Yes": 0.0041966256217635}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9148003813193754, "res": {"Yes": 0.9148003813193754, "No": 0.08519524981893713}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9691461489058455, "res": {"Yes": 0.9691461489058455, "No": 0.03085157735858208}, "ground_truth": 1}, {"key": "28071228", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9619140725302283, "res": {"Yes": 0.9619140725302283, "No": 0.03808143065663972}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6955519332676063, "res": {"Yes": 0.6955519332676063, "No": 0.3044407780226663}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9949770817558733, "res": {"Yes": 0.9949770817558733, "No": 0.005022828790016004}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997992214587097, "res": {"Yes": 0.9997992214587097, "No": 0.00020038901612723692}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999786707670044, "res": {"Yes": 0.999786707670044, "No": 0.0002126408426938491}, "ground_truth": 1}, {"key": "36855834", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9968822908802489, "res": {"Yes": 0.9968822908802489, "No": 0.003117368694943709}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9951890794289928, "res": {"Yes": 0.9951890794289928, "No": 0.0048108716262628025}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.903590150260942, "res": {"Yes": 0.903590150260942, "No": 0.09640629294343858}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7661716256228853, "res": {"Yes": 0.7661716256228853, "No": 0.23381983408219686}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9547657772562076, "res": {"Yes": 0.9547657772562076, "No": 0.0452291359113746}, "ground_truth": 1}, {"key": "40548717", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9431667808536627, "res": {"Yes": 0.9431667808536627, "No": 0.056831160689195394}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.909391425845482, "res": {"Yes": 0.909391425845482, "No": 0.0906052881078694}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9987105958967343, "res": {"Yes": 0.9987105958967343, "No": 0.0012871707323474097}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999217310531738, "res": {"Yes": 0.9999217310531738, "No": 7.761584216502952e-05}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999638075349631, "res": {"Yes": 0.9999638075349631, "No": 3.547511830641926e-05}, "ground_truth": 1}, {"key": "37051175", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999548676244963, "res": {"Yes": 0.9999548676244963, "No": 4.5014045260153474e-05}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.997331003122452, "res": {"Yes": 0.997331003122452, "No": 0.002668574084433115}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9378291119457823, "res": {"Yes": 0.9378291119457823, "No": 0.062168079641933785}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9985931389581563, "res": {"Yes": 0.9985931389581563, "No": 0.001406565164702861}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995054700702547, "res": {"Yes": 0.9995054700702547, "No": 0.0004941452775012254}, "ground_truth": 1}, {"key": "38882119", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998705718505707, "res": {"Yes": 0.998705718505707, "No": 0.001293297138632625}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9978797086002238, "res": {"Yes": 0.9978797086002238, "No": 0.0021173414717545677}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.797955306494417, "res": {"Yes": 0.797955306494417, "No": 0.20204353196934866}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9912340519398342, "res": {"Yes": 0.9912340519398342, "No": 0.00876530468203279}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990721740968816, "res": {"Yes": 0.9990721740968816, "No": 0.0009269017361617834}, "ground_truth": 1}, {"key": "19485402", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9949783826892582, "res": {"Yes": 0.9949783826892582, "No": 0.005019346665816254}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8934085276009819, "res": {"Yes": 0.8934085276009819, "No": 0.10658484972559248}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.035637978427502395, "res": {"No": 0.9643609451707001, "Yes": 0.035637978427502395}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9377704994579451, "res": {"Yes": 0.9377704994579451, "No": 0.06222801367505641}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9081249679046742, "res": {"Yes": 0.9081249679046742, "No": 0.09187344929622625}, "ground_truth": 1}, {"key": "36060907", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9975918156396838, "res": {"Yes": 0.9975918156396838, "No": 0.002407865520652902}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9808623071030287, "res": {"Yes": 0.9808623071030287, "No": 0.019137054445879847}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 8.3962272241221e-05, "res": {"No": 0.9999138642598959, "Yes": 8.3962272241221e-05}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9811233012180288, "res": {"Yes": 0.9811233012180288, "No": 0.018876094476843724}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9909816940723569, "res": {"Yes": 0.9909816940723569, "No": 0.009007056079382625}, "ground_truth": 1}, {"key": "24037309", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9897594689794839, "res": {"Yes": 0.9897594689794839, "No": 0.010234580986335324}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.549435220592239, "res": {"Yes": 0.549435220592239, "No": 0.4505536135611473}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.99990659348666, "res": {"Yes": 0.99990659348666, "No": 9.315190595388718e-05}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9852864508916581, "res": {"Yes": 0.9852864508916581, "No": 0.014711767429836159}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.823550843936138, "res": {"Yes": 0.823550843936138, "No": 0.17644652906163716}, "ground_truth": 1}, {"key": "35605805", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8869660699475314, "res": {"Yes": 0.8869660699475314, "No": 0.11303293981057684}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.06783323584113872, "res": {"No": 0.9321642089086505, "Yes": 0.06783323584113872}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0880518529472118, "res": {"No": 0.9119453216830843, "Yes": 0.0880518529472118}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9460391027061535, "res": {"Yes": 0.9460391027061535, "No": 0.05395940901403007}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8355452944736754, "res": {"Yes": 0.8355452944736754, "No": 0.1644476823151082}, "ground_truth": 1}, {"key": "17706248", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.985585109867639, "res": {"Yes": 0.985585109867639, "No": 0.014412556113548797}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994997547643916, "res": {"Yes": 0.9994997547643916, "No": 0.0004999138871873093}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.999752042066651, "res": {"Yes": 0.999752042066651, "No": 0.0002477909774612775}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998248417619957, "res": {"Yes": 0.9998248417619957, "No": 0.00017491227420252854}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996208766254361, "res": {"Yes": 0.9996208766254361, "No": 0.00037867675726479725}, "ground_truth": 1}, {"key": "36883559", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998555877184575, "res": {"Yes": 0.9998555877184575, "No": 0.00014427029056102386}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9917005610941589, "res": {"Yes": 0.9917005610941589, "No": 0.008298675128441844}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.004261555689654064, "res": {"No": 0.99573791975415, "Yes": 0.004261555689654064}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996444592895836, "res": {"Yes": 0.9996444592895836, "No": 0.0003549817067848871}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987543522640084, "res": {"Yes": 0.9987543522640084, "No": 0.001245165283556881}, "ground_truth": 1}, {"key": "32799471", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990388615896978, "res": {"Yes": 0.9990388615896978, "No": 0.0009607682818238746}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999482724633057, "res": {"Yes": 0.999482724633057, "No": 0.0005167765406527387}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.10821719570631833, "res": {"No": 0.8917818447320218, "Yes": 0.10821719570631833}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998829936457775, "res": {"Yes": 0.9998829936457775, "No": 0.00011696661567426567}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999961110815618, "res": {"Yes": 0.9999961110815618, "No": 3.8101995304503244e-06}, "ground_truth": 1}, {"key": "34797243", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.685119650191391e-07}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999844292352256, "res": {"Yes": 0.9999844292352256, "No": 1.5494475762265482e-05}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.008381768907080825, "res": {"No": 0.9916163950725406, "Yes": 0.008381768907080825}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6954978353421324, "res": {"Yes": 0.6954978353421324, "No": 0.3044984141170302}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7651432712584735, "res": {"Yes": 0.7651432712584735, "No": 0.23484865349352996}, "ground_truth": 1}, {"key": "32154876", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9027629354390551, "res": {"Yes": 0.9027629354390551, "No": 0.09723505348172394}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9561846337887956, "res": {"Yes": 0.9561846337887956, "No": 0.043812881791995814}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9965022813192465, "res": {"Yes": 0.9965022813192465, "No": 0.003497448067493234}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997272578209124, "res": {"Yes": 0.9997272578209124, "No": 0.000272555035258945}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9972902245874231, "res": {"Yes": 0.9972902245874231, "No": 0.0027094435426231896}, "ground_truth": 1}, {"key": "37962274", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9843826456389537, "res": {"Yes": 0.9843826456389537, "No": 0.015616836248436896}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9959151229006813, "res": {"Yes": 0.9959151229006813, "No": 0.004084542712584634}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9746114375562969, "res": {"Yes": 0.9746114375562969, "No": 0.025387904986550334}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998282980724635, "res": {"Yes": 0.9998282980724635, "No": 0.000171536411832767}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998277043895984, "res": {"Yes": 0.998277043895984, "No": 0.0017225774368597798}, "ground_truth": 1}, {"key": "35574030", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998265872938883, "res": {"Yes": 0.998265872938883, "No": 0.0017339035933617458}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.985850696769313, "res": {"Yes": 0.985850696769313, "No": 0.014147632264854375}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0019698661159271965, "res": {"No": 0.9980295361179884, "Yes": 0.0019698661159271965}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.07564333089525158, "res": {"No": 0.9243374854798531, "Yes": 0.07564333089525158}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00016227210034119248, "res": {"No": 0.9998184059102031, "Yes": 0.00016227210034119248}, "ground_truth": 1}, {"key": "39105949", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.24155004540698907, "res": {"No": 0.7584378360343158, "Yes": 0.24155004540698907}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.11563904734240688, "res": {"No": 0.8843488433605714, "Yes": 0.11563904734240688}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9853072889351592, "res": {"Yes": 0.9853072889351592, "No": 0.014692509101675527}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9978935968872904, "res": {"Yes": 0.9978935968872904, "No": 0.002105907686082657}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9573856649798368, "res": {"Yes": 0.9573856649798368, "No": 0.04261355004962805}, "ground_truth": 1}, {"key": "41064322", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9984048819552824, "res": {"Yes": 0.9984048819552824, "No": 0.0015945374257685496}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9460367555860513, "res": {"Yes": 0.9460367555860513, "No": 0.05396236607066665}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9839761037811673, "res": {"Yes": 0.9839761037811673, "No": 0.016022264384234874}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9963295966582395, "res": {"Yes": 0.9963295966582395, "No": 0.003669946113476076}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9960274648770161, "res": {"Yes": 0.9960274648770161, "No": 0.003971573163214354}, "ground_truth": 1}, {"key": "28105101", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9849369780816064, "res": {"Yes": 0.9849369780816064, "No": 0.015061451200467717}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9937834812075185, "res": {"Yes": 0.9937834812075185, "No": 0.006215941979609552}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9986924034503466, "res": {"Yes": 0.9986924034503466, "No": 0.0013072925972993515}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991927200259528, "res": {"Yes": 0.9991927200259528, "No": 0.0008070116932680361}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9931925815667434, "res": {"Yes": 0.9931925815667434, "No": 0.006806805217189523}, "ground_truth": 1}, {"key": "36036068", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998217292014919, "res": {"Yes": 0.998217292014919, "No": 0.001782256537245348}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9798263743935223, "res": {"Yes": 0.9798263743935223, "No": 0.02015977896251577}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0003908936616725287, "res": {"No": 0.999608368747547, "Yes": 0.0003908936616725287}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999742971333243, "res": {"Yes": 0.9999742971333243, "No": 2.561741920951413e-05}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993366324256242, "res": {"Yes": 0.9993366324256242, "No": 0.0006632596602710671}, "ground_truth": 1}, {"key": "37991460", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9967460709395244, "res": {"Yes": 0.9967460709395244, "No": 0.0032539185540022297}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994323545216897, "res": {"Yes": 0.9994323545216897, "No": 0.0005674266886211481}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.09504253982281208, "res": {"No": 0.9049570725985335, "Yes": 0.09504253982281208}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9910054630533377, "res": {"Yes": 0.9910054630533377, "No": 0.008994160909798179}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9872182138411973, "res": {"Yes": 0.9872182138411973, "No": 0.012781339798042832}, "ground_truth": 1}, {"key": "38437830", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.018511520703327348, "res": {"No": 0.981487888625433, "Yes": 0.018511520703327348}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9981133596475252, "res": {"Yes": 0.9981133596475252, "No": 0.0018863251645653927}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.020060371042185318, "res": {"No": 0.9799392274955823, "Yes": 0.020060371042185318}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.025229407513941877, "res": {"No": 0.9747689728350589, "Yes": 0.025229407513941877}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9973332546994663, "res": {"Yes": 0.9973332546994663, "No": 0.00266544728146658}, "ground_truth": 1}, {"key": "36507138", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9605467205992253, "res": {"Yes": 0.9605467205992253, "No": 0.039448265488312574}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9837851315699955, "res": {"Yes": 0.9837851315699955, "No": 0.016212062744064424}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9430763373824557, "res": {"Yes": 0.9430763373824557, "No": 0.056922692707576626}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993749656154227, "res": {"Yes": 0.9993749656154227, "No": 0.0006241811045832464}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998367601050818, "res": {"Yes": 0.9998367601050818, "No": 0.00016259778228942562}, "ground_truth": 1}, {"key": "37824866", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996680461788657, "res": {"Yes": 0.9996680461788657, "No": 0.0003313633667397447}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985351351634304, "res": {"Yes": 0.9985351351634304, "No": 0.0014642362551415366}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5344613295313061, "res": {"Yes": 0.5344613295313061, "No": 0.46553814568721524}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997995789969731, "res": {"Yes": 0.9997995789969731, "No": 0.00020015930169215213}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996480341545159, "res": {"Yes": 0.9996480341545159, "No": 0.00035188751257033486}, "ground_truth": 1}, {"key": "25088134", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9985156404530221, "res": {"Yes": 0.9985156404530221, "No": 0.0014840125164604148}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9981917458650512, "res": {"Yes": 0.9981917458650512, "No": 0.0018079096330163955}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9995328553860379, "res": {"Yes": 0.9995328553860379, "No": 0.00046672282452558136}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6891467505563109, "res": {"Yes": 0.6891467505563109, "No": 0.31084797894280203}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998110203189099, "res": {"Yes": 0.9998110203189099, "No": 0.0001888170502127845}, "ground_truth": 1}, {"key": "40172531", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997600157708231, "res": {"Yes": 0.9997600157708231, "No": 0.00023964281836235548}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9971930065938452, "res": {"Yes": 0.9971930065938452, "No": 0.002806482104639993}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9971537752000016, "res": {"Yes": 0.9971537752000016, "No": 0.0028450916429198976}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998535615431577, "res": {"Yes": 0.9998535615431577, "No": 0.0001462459155654357}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998965813680755, "res": {"Yes": 0.9998965813680755, "No": 0.0001032777083894895}, "ground_truth": 1}, {"key": "37035874", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995832379494402, "res": {"Yes": 0.9995832379494402, "No": 0.0004160936095750272}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999834495597365, "res": {"Yes": 0.999834495597365, "No": 0.00016513900238814328}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9914821948249699, "res": {"Yes": 0.9914821948249699, "No": 0.008517644018762868}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9985596152513155, "res": {"Yes": 0.9985596152513155, "No": 0.0014401082422356723}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9870455940855911, "res": {"Yes": 0.9870455940855911, "No": 0.012953930802784985}, "ground_truth": 1}, {"key": "36404465", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994041343484907, "res": {"Yes": 0.9994041343484907, "No": 0.0005955673960535974}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.993236441025662, "res": {"Yes": 0.993236441025662, "No": 0.006763106182566616}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.00445922943633136, "res": {"No": 0.9955405722081356, "Yes": 0.00445922943633136}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.055957321213302935, "res": {"No": 0.9440412752601138, "Yes": 0.055957321213302935}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7258868865108952, "res": {"Yes": 0.7258868865108952, "No": 0.27410977887651106}, "ground_truth": 1}, {"key": "39602052", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.954531113213769, "res": {"Yes": 0.954531113213769, "No": 0.04546518548867911}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.17967103203420973, "res": {"No": 0.8203256035813741, "Yes": 0.17967103203420973}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.05812591925848114, "res": {"No": 0.941873478497651, "Yes": 0.05812591925848114}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9274176087339461, "res": {"Yes": 0.9274176087339461, "No": 0.07258058624534129}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9655826639652004, "res": {"Yes": 0.9655826639652004, "No": 0.03441655432428004}, "ground_truth": 1}, {"key": "33792789", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9974111720099017, "res": {"Yes": 0.9974111720099017, "No": 0.002588288325324693}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.922007381031895, "res": {"Yes": 0.922007381031895, "No": 0.07799223566528579}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9282257320795652, "res": {"Yes": 0.9282257320795652, "No": 0.07177394871748041}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995969370916878, "res": {"Yes": 0.9995969370916878, "No": 0.0004028591342201428}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.990442642641292, "res": {"Yes": 0.990442642641292, "No": 0.009556901646533783}, "ground_truth": 1}, {"key": "32776626", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997743168702697, "res": {"Yes": 0.9997743168702697, "No": 0.00022552399425581764}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.991380359961402, "res": {"Yes": 0.991380359961402, "No": 0.008619202637803173}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.1610126895536762, "res": {"No": 0.8389861922836475, "Yes": 0.1610126895536762}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996791284902776, "res": {"Yes": 0.9996791284902776, "No": 0.0003207444043945895}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999139834496357, "res": {"Yes": 0.9999139834496357, "No": 8.570040556425787e-05}, "ground_truth": 1}, {"key": "37195090", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997544255583407, "res": {"Yes": 0.9997544255583407, "No": 0.0002454432005057912}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997716949855572, "res": {"Yes": 0.9997716949855572, "No": 0.0002281452660714184}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.477428389472037, "res": {"No": 0.5225693378126006, "Yes": 0.477428389472037}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9700803149449788, "res": {"Yes": 0.9700803149449788, "No": 0.029918986503371495}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9936345732144732, "res": {"Yes": 0.9936345732144732, "No": 0.006364799804630057}, "ground_truth": 1}, {"key": "33981824", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9947748428735124, "res": {"Yes": 0.9947748428735124, "No": 0.005224621102649614}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9978854074077242, "res": {"Yes": 0.9978854074077242, "No": 0.00211380212096479}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.05090681878786272, "res": {"No": 0.9490862968466692, "Yes": 0.05090681878786272}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7671408016128224, "res": {"Yes": 0.7671408016128224, "No": 0.23285794254504844}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8655485596908558, "res": {"Yes": 0.8655485596908558, "No": 0.1344499860531343}, "ground_truth": 1}, {"key": "39569142", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3707879177865428, "res": {"No": 0.6292079014161227, "Yes": 0.3707879177865428}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.05703496945789547, "res": {"No": 0.9429488053055141, "Yes": 0.05703496945789547}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4210521252578221, "res": {"No": 0.5789472563183672, "Yes": 0.4210521252578221}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9748738753180454, "res": {"Yes": 0.9748738753180454, "No": 0.02512560834901262}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9863160807881757, "res": {"Yes": 0.9863160807881757, "No": 0.013683448708290335}, "ground_truth": 1}, {"key": "40268210", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9977080900455512, "res": {"Yes": 0.9977080900455512, "No": 0.0022918807735582427}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.997533218917192, "res": {"Yes": 0.997533218917192, "No": 0.002466739600763869}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.18701777746282025, "res": {"No": 0.8129819836597343, "Yes": 0.18701777746282025}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6621812294580833, "res": {"Yes": 0.6621812294580833, "No": 0.3378171183164585}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9934526370003298, "res": {"Yes": 0.9934526370003298, "No": 0.006546855637119918}, "ground_truth": 1}, {"key": "34925159", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9980966129430131, "res": {"Yes": 0.9980966129430131, "No": 0.0019033305620483817}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6314809524737548, "res": {"Yes": 0.6314809524737548, "No": 0.3685180817630953}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9984326839247104, "res": {"Yes": 0.9984326839247104, "No": 0.0015671141062124385}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9846514246949871, "res": {"Yes": 0.9846514246949871, "No": 0.015348201161375636}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7461155485164442, "res": {"Yes": 0.7461155485164442, "No": 0.2538830375765687}, "ground_truth": 1}, {"key": "36181903", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.053819619692183046, "res": {"No": 0.9461797352482596, "Yes": 0.053819619692183046}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6295137393007573, "res": {"Yes": 0.6295137393007573, "No": 0.37048448906283216}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9978914594014952, "res": {"Yes": 0.9978914594014952, "No": 0.002108458852555197}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9017818135784126, "res": {"Yes": 0.9017818135784126, "No": 0.09821697667493506}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9732148901447292, "res": {"Yes": 0.9732148901447292, "No": 0.02678451116881487}, "ground_truth": 1}, {"key": "38620559", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.995383799556553, "res": {"Yes": 0.995383799556553, "No": 0.004615806361829192}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9854113300684748, "res": {"Yes": 0.9854113300684748, "No": 0.014588554442584856}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0053483242042090574, "res": {"No": 0.994651226900687, "Yes": 0.0053483242042090574}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.012894015370865444, "res": {"No": 0.9871045984736039, "Yes": 0.012894015370865444}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.26255586514325063, "res": {"No": 0.737441202035509, "Yes": 0.26255586514325063}, "ground_truth": 1}, {"key": "32719657", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6473061580729665, "res": {"Yes": 0.6473061580729665, "No": 0.35268953968686223}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.003949900066537131, "res": {"No": 0.9960486332752572, "Yes": 0.003949900066537131}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.004520730423834976, "res": {"No": 0.9954790193397276, "Yes": 0.004520730423834976}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8787488539853167, "res": {"Yes": 0.8787488539853167, "No": 0.12124956946196538}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9864338046374487, "res": {"Yes": 0.9864338046374487, "No": 0.013564810537221524}, "ground_truth": 1}, {"key": "37530914", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9797208645320915, "res": {"Yes": 0.9797208645320915, "No": 0.02027900225380028}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9690729336491463, "res": {"Yes": 0.9690729336491463, "No": 0.030925363701897076}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9172785138443872, "res": {"Yes": 0.9172785138443872, "No": 0.08272103137775505}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9853588967412178, "res": {"Yes": 0.9853588967412178, "No": 0.014640680343180742}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998117354140017, "res": {"Yes": 0.9998117354140017, "No": 0.00018794992255598655}, "ground_truth": 1}, {"key": "33306933", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9975130520917145, "res": {"Yes": 0.9975130520917145, "No": 0.002486928161955639}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.991430156264696, "res": {"Yes": 0.991430156264696, "No": 0.008569733874543989}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999782307609533, "res": {"Yes": 0.9999782307609533, "No": 2.1699138471070124e-05}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5444257551959185, "res": {"Yes": 0.5444257551959185, "No": 0.45557068190294836}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995193954273944, "res": {"Yes": 0.9995193954273944, "No": 0.0004803886952441711}, "ground_truth": 1}, {"key": "33837212", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997464409015432, "res": {"Yes": 0.9997464409015432, "No": 0.00025341046312158153}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.00020407111947462017, "res": {"No": 0.9997958844344171, "Yes": 0.00020407111947462017}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.773484111675716, "res": {"Yes": 0.773484111675716, "No": 0.22651454948165559}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997859962620674, "res": {"Yes": 0.9997859962620674, "No": 0.00021317694700782733}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8567511636621313, "res": {"Yes": 0.8567511636621313, "No": 0.14324741054863335}, "ground_truth": 1}, {"key": "40945179", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8973352957008496, "res": {"Yes": 0.8973352957008496, "No": 0.10265727152337802}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994511672038477, "res": {"Yes": 0.9994511672038477, "No": 0.0005484162385158336}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.13826120403761605, "res": {"No": 0.8617385849776178, "Yes": 0.13826120403761605}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9984442140916071, "res": {"Yes": 0.9984442140916071, "No": 0.0015553697193062747}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980507695220429, "res": {"Yes": 0.9980507695220429, "No": 0.00194835412747254}, "ground_truth": 1}, {"key": "34152358", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9378379088241097, "res": {"Yes": 0.9378379088241097, "No": 0.06216130990667956}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996502945312168, "res": {"Yes": 0.9996502945312168, "No": 0.00034911247840219297}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4378790886613507, "res": {"No": 0.5621192067084809, "Yes": 0.4378790886613507}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.761742825199145, "res": {"Yes": 0.761742825199145, "No": 0.2382554170202761}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9864536400478169, "res": {"Yes": 0.9864536400478169, "No": 0.013545846635622132}, "ground_truth": 1}, {"key": "34136541", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9358293102297136, "res": {"Yes": 0.9358293102297136, "No": 0.0641687786781116}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7658260912037028, "res": {"Yes": 0.7658260912037028, "No": 0.23416415323873835}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9586716793649632, "res": {"Yes": 0.9586716793649632, "No": 0.04132767940460044}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7327373230885138, "res": {"Yes": 0.7327373230885138, "No": 0.26726035054625585}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9948347768788749, "res": {"Yes": 0.9948347768788749, "No": 0.005165148115784116}, "ground_truth": 1}, {"key": "37469603", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9461174152800752, "res": {"Yes": 0.9461174152800752, "No": 0.05388179571238886}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9859496451610386, "res": {"Yes": 0.9859496451610386, "No": 0.014049980094007576}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8928180234525471, "res": {"Yes": 0.8928180234525471, "No": 0.1071800015986361}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.978177299055577, "res": {"Yes": 0.978177299055577, "No": 0.02182107572147032}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9841414128594126, "res": {"Yes": 0.9841414128594126, "No": 0.015857425540589356}, "ground_truth": 1}, {"key": "37353611", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992543757160417, "res": {"Yes": 0.9992543757160417, "No": 0.000745149789546922}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.912761083085231, "res": {"Yes": 0.912761083085231, "No": 0.08723521393976183}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9950399830112423, "res": {"Yes": 0.9950399830112423, "No": 0.004959739796522117}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998965813680755, "res": {"Yes": 0.9998965813680755, "No": 0.00010265671501798375}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999933054575945, "res": {"Yes": 0.999933054575945, "No": 6.58149198430983e-05}, "ground_truth": 1}, {"key": "37211649", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999834495597365, "res": {"Yes": 0.999834495597365, "No": 0.00016513966294547404}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998843047282142, "res": {"Yes": 0.9998843047282142, "No": 0.00011442602655986099}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9992453302665525, "res": {"Yes": 0.9992453302665525, "No": 0.000754499079326743}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993563962418075, "res": {"Yes": 0.9993563962418075, "No": 0.0006435286562902683}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994374737272633, "res": {"Yes": 0.9994374737272633, "No": 0.0005623613180342383}, "ground_truth": 1}, {"key": "37320976", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996612574862052, "res": {"Yes": 0.9996612574862052, "No": 0.0003384707093769845}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997942159164498, "res": {"Yes": 0.9997942159164498, "No": 0.00020555292800257443}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9909470380665504, "res": {"Yes": 0.9909470380665504, "No": 0.009052245776097124}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993194896522671, "res": {"Yes": 0.9993194896522671, "No": 0.0006804001343399363}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9975236091274627, "res": {"Yes": 0.9975236091274627, "No": 0.002475822536979615}, "ground_truth": 1}, {"key": "34492412", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993118694005324, "res": {"Yes": 0.9993118694005324, "No": 0.0006879715999674606}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9617407069910029, "res": {"Yes": 0.9617407069910029, "No": 0.03825830569226987}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8226151550522518, "res": {"Yes": 0.8226151550522518, "No": 0.17738323810745668}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9852241857113282, "res": {"Yes": 0.9852241857113282, "No": 0.014774390036910424}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9858702759585716, "res": {"Yes": 0.9858702759585716, "No": 0.014128983839237368}, "ground_truth": 1}, {"key": "36655016", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9743596675213724, "res": {"Yes": 0.9743596675213724, "No": 0.025639516611833373}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.19405999794004994, "res": {"No": 0.8059381148551702, "Yes": 0.19405999794004994}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9911357868581903, "res": {"Yes": 0.9911357868581903, "No": 0.008864131622311205}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9308984815727265, "res": {"Yes": 0.9308984815727265, "No": 0.06910119186148694}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998026776706121, "res": {"Yes": 0.9998026776706121, "No": 0.0001972023892493934}, "ground_truth": 1}, {"key": "35220773", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992286691686822, "res": {"Yes": 0.9992286691686822, "No": 0.0007713008908707731}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997280920336735, "res": {"Yes": 0.9997280920336735, "No": 0.0002718617208947895}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9976459186058343, "res": {"Yes": 0.9976459186058343, "No": 0.002353354080752915}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.976089694196574, "res": {"Yes": 0.976089694196574, "No": 0.02390905551416451}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9977210242175267, "res": {"Yes": 0.9977210242175267, "No": 0.0022772083365879266}, "ground_truth": 1}, {"key": "31569808", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9968931905517395, "res": {"Yes": 0.9968931905517395, "No": 0.0031060079335281563}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985485600593004, "res": {"Yes": 0.9985485600593004, "No": 0.001450662398951753}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9982472271037397, "res": {"Yes": 0.9982472271037397, "No": 0.0017526576252830427}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9970365651672387, "res": {"Yes": 0.9970365651672387, "No": 0.002963160037109464}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9878904232763539, "res": {"Yes": 0.9878904232763539, "No": 0.012109185283768305}, "ground_truth": 1}, {"key": "37696256", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9760157621066627, "res": {"Yes": 0.9760157621066627, "No": 0.023983701104186017}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999523644646081, "res": {"Yes": 0.9999523644646081, "No": 4.7491585974182035e-05}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.008061679253963705, "res": {"No": 0.9919373300953648, "Yes": 0.008061679253963705}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9849714322721771, "res": {"Yes": 0.9849714322721771, "No": 0.01502720581027794}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9302064576495441, "res": {"Yes": 0.9302064576495441, "No": 0.06978863533640763}, "ground_truth": 1}, {"key": "36874328", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9592779192385217, "res": {"Yes": 0.9592779192385217, "No": 0.04071096957992766}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7946946787352274, "res": {"Yes": 0.7946946787352274, "No": 0.20530403520237897}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9997907597337986, "res": {"Yes": 0.9997907597337986, "No": 0.00020896140251835902}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993519885801483, "res": {"Yes": 0.9993519885801483, "No": 0.0006478089728870223}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999030529040918, "res": {"Yes": 0.999030529040918, "No": 0.000968857515221959}, "ground_truth": 1}, {"key": "24532377", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9965228776398435, "res": {"Yes": 0.9965228776398435, "No": 0.0034758924944710717}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9991527337329321, "res": {"Yes": 0.9991527337329321, "No": 0.0008469727806628221}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8394861924075334, "res": {"Yes": 0.8394861924075334, "No": 0.16051238087163855}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992075976167174, "res": {"Yes": 0.9992075976167174, "No": 0.000792036960453074}, "ground_truth": 1}, {"key": "39560618", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998430768937189, "res": {"Yes": 0.9998430768937189, "No": 0.00015650039876001444}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.1439046430211838, "res": {"No": 0.8560944329998685, "Yes": 0.1439046430211838}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8639542352859474, "res": {"Yes": 0.8639542352859474, "No": 0.1360455803178694}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999537948404913, "res": {"Yes": 0.9999537948404913, "No": 4.6113813996321326e-05}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.875967175183082, "res": {"Yes": 0.875967175183082, "No": 0.1240287853993693}, "ground_truth": 1}, {"key": "34922693", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998584218565489, "res": {"Yes": 0.998584218565489, "No": 0.0014155685874667739}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9971636117716492, "res": {"Yes": 0.9971636117716492, "No": 0.002835032154192209}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.06980693631574636, "res": {"No": 0.9301876816216942, "Yes": 0.06980693631574636}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.47310132295268564, "res": {"No": 0.5268955223000042, "Yes": 0.47310132295268564}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.965737303789028, "res": {"Yes": 0.965737303789028, "No": 0.034256744977950594}, "ground_truth": 1}, {"key": "33629577", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9199416268758649, "res": {"Yes": 0.9199416268758649, "No": 0.08004761771057921}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.48996288286582634, "res": {"No": 0.5100349888646819, "Yes": 0.48996288286582634}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8927322188357201, "res": {"Yes": 0.8927322188357201, "No": 0.10726704565033417}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9759833950326416, "res": {"Yes": 0.9759833950326416, "No": 0.024014398284464725}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9958917119002785, "res": {"Yes": 0.9958917119002785, "No": 0.004107948185776978}, "ground_truth": 1}, {"key": "32284359", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9923576573433821, "res": {"Yes": 0.9923576573433821, "No": 0.00764155929824244}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9823954697605335, "res": {"Yes": 0.9823954697605335, "No": 0.017601685754836272}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9990907381892707, "res": {"Yes": 0.9990907381892707, "No": 0.000908806825111254}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8993473098756396, "res": {"Yes": 0.8993473098756396, "No": 0.10065101927727733}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6892944781022207, "res": {"Yes": 0.6892944781022207, "No": 0.31070238077370155}, "ground_truth": 1}, {"key": "28082962", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995961029883677, "res": {"Yes": 0.9995961029883677, "No": 0.000403452418153311}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994065133429176, "res": {"Yes": 0.9994065133429176, "No": 0.0005928625342028854}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9742586170487708, "res": {"Yes": 0.9742586170487708, "No": 0.02574063518903357}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9907094632147194, "res": {"Yes": 0.9907094632147194, "No": 0.009289073147231465}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9955795594354243, "res": {"Yes": 0.9955795594354243, "No": 0.004419875724132132}, "ground_truth": 1}, {"key": "24796803", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.981579876999329, "res": {"Yes": 0.981579876999329, "No": 0.018416683743572665}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9794021798666391, "res": {"Yes": 0.9794021798666391, "No": 0.020590783627946353}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.02366812908959291, "res": {"No": 0.9763280375424098, "Yes": 0.02366812908959291}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.21251406597176647, "res": {"No": 0.7874739407035256, "Yes": 0.21251406597176647}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.02436714184309616, "res": {"No": 0.9756282163603766, "Yes": 0.02436714184309616}, "ground_truth": 1}, {"key": "35466150", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00048196069156933324, "res": {"No": 0.99951713165846, "Yes": 0.00048196069156933324}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.03596784262994632, "res": {"No": 0.9640306849665685, "Yes": 0.03596784262994632}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9998681023692575, "res": {"Yes": 0.9998681023692575, "No": 0.0001317858897064418}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9984568117414185, "res": {"Yes": 0.9984568117414185, "No": 0.0015430967577761139}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988904068542298, "res": {"Yes": 0.9988904068542298, "No": 0.0011094254614028526}, "ground_truth": 1}, {"key": "35754289", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9488065512386731, "res": {"Yes": 0.9488065512386731, "No": 0.05119303455700344}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.1956443321653243, "res": {"No": 0.8043548189925761, "Yes": 0.1956443321653243}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5203255008847658, "res": {"Yes": 0.5203255008847658, "No": 0.4796737469648494}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.995223322185385, "res": {"Yes": 0.995223322185385, "No": 0.004776441336601483}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9559296638653433, "res": {"Yes": 0.9559296638653433, "No": 0.0440686911460881}, "ground_truth": 1}, {"key": "36678662", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6556747637155815, "res": {"Yes": 0.6556747637155815, "No": 0.3443242425473783}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8309798685431304, "res": {"Yes": 0.8309798685431304, "No": 0.16901841592930072}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9987943044356663, "res": {"Yes": 0.9987943044356663, "No": 0.0012056432946594019}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9979032100417703, "res": {"Yes": 0.9979032100417703, "No": 0.0020966934977514695}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999002763027385, "res": {"Yes": 0.9999002763027385, "No": 9.95232771453895e-05}, "ground_truth": 1}, {"key": "35399671", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9891740430746242, "res": {"Yes": 0.9891740430746242, "No": 0.0108256755562169}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9965673898230519, "res": {"Yes": 0.9965673898230519, "No": 0.0034325906889537843}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.008457281438268462, "res": {"No": 0.9915409037110522, "Yes": 0.008457281438268462}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9030606886646171, "res": {"Yes": 0.9030606886646171, "No": 0.09693414001500612}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.36581662343638777, "res": {"No": 0.6341780677632027, "Yes": 0.36581662343638777}, "ground_truth": 1}, {"key": "36888180", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9670452155874673, "res": {"Yes": 0.9670452155874673, "No": 0.03295303872431824}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.13827966314047277, "res": {"No": 0.8617155682474029, "Yes": 0.13827966314047277}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9994038960805794, "res": {"Yes": 0.9994038960805794, "No": 0.0005959629841252821}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9799529663398608, "res": {"Yes": 0.9799529663398608, "No": 0.020046955142077057}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991549931195635, "res": {"Yes": 0.9991549931195635, "No": 0.0008449320060987505}, "ground_truth": 1}, {"key": "28061069", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997021203349599, "res": {"Yes": 0.9997021203349599, "No": 0.0002977709473685819}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9983010342790257, "res": {"Yes": 0.9983010342790257, "No": 0.0016988449500360144}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9392924311338752, "res": {"Yes": 0.9392924311338752, "No": 0.06070704044991378}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990733650215952, "res": {"Yes": 0.9990733650215952, "No": 0.0009264856507004233}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9976373746032445, "res": {"Yes": 0.9976373746032445, "No": 0.0023622115530441867}, "ground_truth": 1}, {"key": "22259982", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997166553096911, "res": {"Yes": 0.9997166553096911, "No": 0.00028312077063303984}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9848978872011687, "res": {"Yes": 0.9848978872011687, "No": 0.015101297676692226}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9826520951458135, "res": {"Yes": 0.9826520951458135, "No": 0.017345893265531306}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8712136582260444, "res": {"Yes": 0.8712136582260444, "No": 0.12878447606777557}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.544931271287772, "res": {"Yes": 0.544931271287772, "No": 0.4550657613659928}, "ground_truth": 1}, {"key": "34026805", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9519179736835974, "res": {"Yes": 0.9519179736835974, "No": 0.048078061874413686}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0019037251633729079, "res": {"No": 0.9980946013811264, "Yes": 0.0019037251633729079}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9991733241249329, "res": {"Yes": 0.9991733241249329, "No": 0.000826184040450076}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996776985102879, "res": {"Yes": 0.9996776985102879, "No": 0.0003217602033330571}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999309090568892, "res": {"Yes": 0.9999309090568892, "No": 6.862085916441963e-05}, "ground_truth": 1}, {"key": "36713809", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999008722634788, "res": {"Yes": 0.9999008722634788, "No": 9.89981890917015e-05}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984249588812335, "res": {"Yes": 0.9984249588812335, "No": 0.0015744776696911707}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 6.396413642685531e-05, "res": {"No": 0.9999352000996042, "Yes": 6.396413642685531e-05}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9823725713713991, "res": {"Yes": 0.9823725713713991, "No": 0.017626539263463234}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987419889601543, "res": {"Yes": 0.9987419889601543, "No": 0.0012571387168166675}, "ground_truth": 1}, {"key": "39726411", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999187367594702, "res": {"Yes": 0.999187367594702, "No": 0.0008120813809335488}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9970392877787045, "res": {"Yes": 0.9970392877787045, "No": 0.0029603330502481554}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.016888097417630126, "res": {"No": 0.9831114685273555, "Yes": 0.016888097417630126}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9625719234015666, "res": {"Yes": 0.9625719234015666, "No": 0.03742490077434749}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7474638022301472, "res": {"Yes": 0.7474638022301472, "No": 0.25253394592397616}, "ground_truth": 1}, {"key": "37069841", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6572222090159131, "res": {"Yes": 0.6572222090159131, "No": 0.34277384270423283}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 7.579495577669131e-07, "res": {"No": 0.9999984951481323, "Yes": 7.579495577669131e-07}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7649959035550029, "res": {"Yes": 0.7649959035550029, "No": 0.23499876974014516}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9922051933026812, "res": {"Yes": 0.9922051933026812, "No": 0.0077919408795299955}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8604910537124381, "res": {"Yes": 0.8604910537124381, "No": 0.13948025903896585}, "ground_truth": 1}, {"key": "38894693", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8675107285786149, "res": {"Yes": 0.8675107285786149, "No": 0.13248150873656142}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.269119973679407, "res": {"No": 0.7308298570626242, "Yes": 0.269119973679407}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9481809712526275, "res": {"Yes": 0.9481809712526275, "No": 0.051818642533192606}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6159745815607921, "res": {"Yes": 0.6159745815607921, "No": 0.38402431810543436}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7979777852120122, "res": {"Yes": 0.7979777852120122, "No": 0.2020207023401345}, "ground_truth": 1}, {"key": "33946032", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9925709024853405, "res": {"Yes": 0.9925709024853405, "No": 0.007428477899404961}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7410068570130894, "res": {"Yes": 0.7410068570130894, "No": 0.25899207919731365}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5096852503293577, "res": {"Yes": 0.5096852503293577, "No": 0.4903128608969948}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9063977741275568, "res": {"Yes": 0.9063977741275568, "No": 0.09360152527109557}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9968683126947675, "res": {"Yes": 0.9968683126947675, "No": 0.0031313658368843254}, "ground_truth": 1}, {"key": "39035311", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9941267966885454, "res": {"Yes": 0.9941267966885454, "No": 0.005872657628420235}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9887656054657947, "res": {"Yes": 0.9887656054657947, "No": 0.011233139338621141}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9984733298483168, "res": {"Yes": 0.9984733298483168, "No": 0.0015257843092236472}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9987366352180719, "res": {"Yes": 0.9987366352180719, "No": 0.0012629049446573936}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9972870220941958, "res": {"Yes": 0.9972870220941958, "No": 0.002712237605755653}, "ground_truth": 1}, {"key": "27680038", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994265205022627, "res": {"Yes": 0.9994265205022627, "No": 0.0005728060386714884}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988921893757513, "res": {"Yes": 0.9988921893757513, "No": 0.0011073001763488464}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 1.7270529606584572e-05, "res": {"No": 0.9999824028078323, "Yes": 1.7270529606584572e-05}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.014274279465292108, "res": {"No": 0.98572327295804, "Yes": 0.014274279465292108}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.045950019766795504, "res": {"No": 0.954049444748582, "Yes": 0.045950019766795504}, "ground_truth": 1}, {"key": "36901907", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0546837985944081, "res": {"No": 0.945313301930559, "Yes": 0.0546837985944081}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.24841779326167532, "res": {"No": 0.7515810534872368, "Yes": 0.24841779326167532}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9983312134752799, "res": {"Yes": 0.9983312134752799, "No": 0.0016683896486803637}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.968669190550346, "res": {"Yes": 0.968669190550346, "No": 0.03133047853863968}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990763423845482, "res": {"Yes": 0.9990763423845482, "No": 0.0009233166649635436}, "ground_truth": 1}, {"key": "21530542", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988700678546135, "res": {"Yes": 0.9988700678546135, "No": 0.0011295499499169314}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9982025630281547, "res": {"Yes": 0.9982025630281547, "No": 0.0017971270005993337}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6613274076845377, "res": {"Yes": 0.6613274076845377, "No": 0.33866969419486853}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.058155809476194066, "res": {"No": 0.9418437638000149, "Yes": 0.058155809476194066}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5364439799379024, "res": {"Yes": 0.5364439799379024, "No": 0.46354925133451}, "ground_truth": 1}, {"key": "38192532", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7487941697301813, "res": {"Yes": 0.7487941697301813, "No": 0.2512024226819717}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.29783319426031835, "res": {"No": 0.7021654633163549, "Yes": 0.29783319426031835}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9595114119141038, "res": {"Yes": 0.9595114119141038, "No": 0.040484524054824396}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9493426939185305, "res": {"Yes": 0.9493426939185305, "No": 0.05065668868736421}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3854042328721659, "res": {"No": 0.614592784199383, "Yes": 0.3854042328721659}, "ground_truth": 1}, {"key": "34102400", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7798976623668729, "res": {"Yes": 0.7798976623668729, "No": 0.22009605814328215}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.45301866103944777, "res": {"No": 0.5469787092927617, "Yes": 0.45301866103944777}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8048972334688376, "res": {"Yes": 0.8048972334688376, "No": 0.19510230831063943}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8373418239884276, "res": {"Yes": 0.8373418239884276, "No": 0.16265712846531577}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9369291193279297, "res": {"Yes": 0.9369291193279297, "No": 0.06306338167467102}, "ground_truth": 1}, {"key": "36133399", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3491387399858663, "res": {"No": 0.6508603147978778, "Yes": 0.3491387399858663}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.1016564386038809, "res": {"No": 0.8983413234214555, "Yes": 0.1016564386038809}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4324669810143855, "res": {"No": 0.5675310599130248, "Yes": 0.4324669810143855}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9467897427484593, "res": {"Yes": 0.9467897427484593, "No": 0.053207809409286246}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.988100578810593, "res": {"Yes": 0.988100578810593, "No": 0.011896131687358544}, "ground_truth": 1}, {"key": "34314544", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9179353643915679, "res": {"Yes": 0.9179353643915679, "No": 0.08206122204400132}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8081386650696764, "res": {"Yes": 0.8081386650696764, "No": 0.19182896715819572}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9382861523762827, "res": {"Yes": 0.9382861523762827, "No": 0.061711060597233795}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999801379802525, "res": {"Yes": 0.9999801379802525, "No": 1.8982975628802497e-05}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992162889620424, "res": {"Yes": 0.9992162889620424, "No": 0.0007823682659078287}, "ground_truth": 1}, {"key": "33460074", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989552333491094, "res": {"Yes": 0.9989552333491094, "No": 0.0010441943999577004}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995277320236443, "res": {"Yes": 0.9995277320236443, "No": 0.0004711853579828909}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.14143742299980258, "res": {"No": 0.8585590484970095, "Yes": 0.14143742299980258}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9557615076869449, "res": {"Yes": 0.9557615076869449, "No": 0.04423760764370665}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0065238910124236285, "res": {"No": 0.9934749953008969, "Yes": 0.0065238910124236285}, "ground_truth": 1}, {"key": "36191495", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.03842612546772822, "res": {"No": 0.9615734623228605, "Yes": 0.03842612546772822}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9898307124504926, "res": {"Yes": 0.9898307124504926, "No": 0.01016655670496963}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7326770432685877, "res": {"Yes": 0.7326770432685877, "No": 0.2673219611574069}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9943676661038118, "res": {"Yes": 0.9943676661038118, "No": 0.005631277236212559}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9785885603572577, "res": {"Yes": 0.9785885603572577, "No": 0.02141120705233178}, "ground_truth": 1}, {"key": "39532668", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9157129882604519, "res": {"Yes": 0.9157129882604519, "No": 0.08428669968736512}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.988510194820265, "res": {"Yes": 0.988510194820265, "No": 0.011485820550340625}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 1.1674706347127287e-06, "res": {"No": 0.9999978991308068, "Yes": 1.1674706347127287e-06}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991429819898906, "res": {"Yes": 0.9991429819898906, "No": 0.0008564385399365926}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9737508255428531, "res": {"Yes": 0.9737508255428531, "No": 0.0262475533500712}, "ground_truth": 1}, {"key": "20328247", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9980970889354013, "res": {"Yes": 0.9980970889354013, "No": 0.0019022642344143188}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9903148461490501, "res": {"Yes": 0.9903148461490501, "No": 0.009684660857801033}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9652701197241135, "res": {"Yes": 0.9652701197241135, "No": 0.03472370444628505}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9960080656382064, "res": {"Yes": 0.9960080656382064, "No": 0.003988775449789291}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.997912351176413, "res": {"Yes": 0.997912351176413, "No": 0.0020868897068157966}, "ground_truth": 1}, {"key": "39112675", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9896214457588324, "res": {"Yes": 0.9896214457588324, "No": 0.010375645478556595}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9164801045611777, "res": {"Yes": 0.9164801045611777, "No": 0.0834546924314836}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0001952603034668353, "res": {"No": 0.9998044653793863, "Yes": 0.0001952603034668353}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9499962611755303, "res": {"Yes": 0.9499962611755303, "No": 0.0500019037139399}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9964686673729863, "res": {"Yes": 0.9964686673729863, "No": 0.0035313275579409555}, "ground_truth": 1}, {"key": "31620300", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9938084461571617, "res": {"Yes": 0.9938084461571617, "No": 0.006190756416461249}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9674007493418043, "res": {"Yes": 0.9674007493418043, "No": 0.032598011154538635}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.06858569456736238, "res": {"No": 0.9314139323895005, "Yes": 0.06858569456736238}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9983189743091264, "res": {"Yes": 0.9983189743091264, "No": 0.0016802301515158665}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9919894161081476, "res": {"Yes": 0.9919894161081476, "No": 0.00800983594007412}, "ground_truth": 1}, {"key": "37518509", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989617754284589, "res": {"Yes": 0.9989617754284589, "No": 0.0010381246653051437}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.972565643523935, "res": {"Yes": 0.972565643523935, "No": 0.02743413330009759}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3431328805457259, "res": {"No": 0.6568624520672364, "Yes": 0.3431328805457259}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9911943379519047, "res": {"Yes": 0.9911943379519047, "No": 0.008805198440820209}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9955885421920811, "res": {"Yes": 0.9955885421920811, "No": 0.004407523552386515}, "ground_truth": 1}, {"key": "35454095", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9980323840991361, "res": {"Yes": 0.9980323840991361, "No": 0.0019674834291408512}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9826470305699665, "res": {"Yes": 0.9826470305699665, "No": 0.017352222201722344}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.999920539107184, "res": {"Yes": 0.999920539107184, "No": 7.857499805767657e-05}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997981488446863, "res": {"Yes": 0.9997981488446863, "No": 0.00020159476285626542}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999790521363714, "res": {"Yes": 0.999790521363714, "No": 0.00020887031520533847}, "ground_truth": 1}, {"key": "38542788", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991441730689494, "res": {"Yes": 0.9991441730689494, "No": 0.000855652433421417}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984539553602573, "res": {"Yes": 0.9984539553602573, "No": 0.001545454248301207}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9132863693590543, "res": {"Yes": 0.9132863693590543, "No": 0.08671225983018219}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994565284342001, "res": {"Yes": 0.9994565284342001, "No": 0.0005428700962916022}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9976735622607503, "res": {"Yes": 0.9976735622607503, "No": 0.0023238011670487016}, "ground_truth": 1}, {"key": "23944937", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9911137680301355, "res": {"Yes": 0.9911137680301355, "No": 0.008884684742474632}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995166550788102, "res": {"Yes": 0.9995166550788102, "No": 0.000482359437920151}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.24336887074833063, "res": {"No": 0.7566273794155588, "Yes": 0.24336887074833063}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9569397468122927, "res": {"Yes": 0.9569397468122927, "No": 0.043058156513660156}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.44860727944461987, "res": {"No": 0.5513881728132365, "Yes": 0.44860727944461987}, "ground_truth": 1}, {"key": "31753944", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9876024458054034, "res": {"Yes": 0.9876024458054034, "No": 0.012397178160130778}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9942067897346843, "res": {"Yes": 0.9942067897346843, "No": 0.005792096286421723}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9977343155464535, "res": {"Yes": 0.9977343155464535, "No": 0.002265481409059498}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9958962051746406, "res": {"Yes": 0.9958962051746406, "No": 0.0041037528280940165}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995147487424925, "res": {"Yes": 0.9995147487424925, "No": 0.00048511736820703894}, "ground_truth": 1}, {"key": "35527214", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.961350425266525, "res": {"Yes": 0.961350425266525, "No": 0.03864916918654713}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9859525433642802, "res": {"Yes": 0.9859525433642802, "No": 0.014047286970967642}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.08415099788567547, "res": {"No": 0.9158479514069493, "Yes": 0.08415099788567547}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.0055093496149412405, "res": {"No": 0.994488379621916, "Yes": 0.0055093496149412405}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8642485050047064, "res": {"Yes": 0.8642485050047064, "No": 0.13574920181516512}, "ground_truth": 1}, {"key": "40400404", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8499860171881212, "res": {"Yes": 0.8499860171881212, "No": 0.15001139816592088}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.4103887778169722, "res": {"No": 0.5896042676033378, "Yes": 0.4103887778169722}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0005805404952500769, "res": {"No": 0.9994191378657657, "Yes": 0.0005805404952500769}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9966754933507148, "res": {"Yes": 0.9966754933507148, "No": 0.0033243217853857012}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991426247563727, "res": {"Yes": 0.9991426247563727, "No": 0.0008572161106809461}, "ground_truth": 1}, {"key": "21713119", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9980854511911925, "res": {"Yes": 0.9980854511911925, "No": 0.001913989637538982}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9975536202761915, "res": {"Yes": 0.9975536202761915, "No": 0.002446109440688429}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9839210489064896, "res": {"Yes": 0.9839210489064896, "No": 0.01607873640656982}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997933816685082, "res": {"Yes": 0.9997933816685082, "No": 0.00020645563732472763}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996279070137725, "res": {"Yes": 0.9996279070137725, "No": 0.0003718739891203153}, "ground_truth": 1}, {"key": "28730678", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9873842611248296, "res": {"Yes": 0.9873842611248296, "No": 0.012615441493481601}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999684368122225, "res": {"Yes": 0.999684368122225, "No": 0.0003155122656110557}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.07088715730527495, "res": {"No": 0.9291110873275822, "Yes": 0.07088715730527495}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.25217941008536093, "res": {"No": 0.7478194927372287, "Yes": 0.25217941008536093}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6287141167324807, "res": {"Yes": 0.6287141167324807, "No": 0.371283558382845}, "ground_truth": 1}, {"key": "36823733", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8716252819192744, "res": {"Yes": 0.8716252819192744, "No": 0.1283733710257374}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.12641674876440792, "res": {"No": 0.87357838215445, "Yes": 0.12641674876440792}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996430293791788, "res": {"Yes": 0.9996430293791788, "No": 0.0003567745458178005}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999224462174501, "res": {"Yes": 0.9999224462174501, "No": 7.746858954137618e-05}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999914621674475, "res": {"Yes": 0.9999914621674475, "No": 8.453736711199522e-06}, "ground_truth": 1}, {"key": "35988862", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999782897630131, "res": {"Yes": 0.999782897630131, "No": 0.00021698702474790306}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992656880390844, "res": {"Yes": 0.9992656880390844, "No": 0.0007341596839100619}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9047410851244349, "res": {"Yes": 0.9047410851244349, "No": 0.09525320664287536}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6112332508749843, "res": {"Yes": 0.6112332508749843, "No": 0.38876512869059776}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9705421559156099, "res": {"Yes": 0.9705421559156099, "No": 0.029456343296699588}, "ground_truth": 1}, {"key": "40499665", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7456613546756482, "res": {"Yes": 0.7456613546756482, "No": 0.25433804779272684}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9270392160963749, "res": {"Yes": 0.9270392160963749, "No": 0.07295949900116395}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.07023103300740827, "res": {"No": 0.9297682848078219, "Yes": 0.07023103300740827}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.971816834647256, "res": {"Yes": 0.971816834647256, "No": 0.028182498902167303}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999162481273839, "res": {"Yes": 0.9999162481273839, "No": 8.301950315496214e-05}, "ground_truth": 1}, {"key": "32829820", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993113929587261, "res": {"Yes": 0.9993113929587261, "No": 0.0006885094599142345}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9934968804052265, "res": {"Yes": 0.9934968804052265, "No": 0.006502789762027087}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9411101781620193, "res": {"Yes": 0.9411101781620193, "No": 0.058889315821465366}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9494159717622995, "res": {"Yes": 0.9494159717622995, "No": 0.05058336559087345}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9967293766790625, "res": {"Yes": 0.9967293766790625, "No": 0.003270602697153678}, "ground_truth": 1}, {"key": "20583553", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9880139933745535, "res": {"Yes": 0.9880139933745535, "No": 0.011983542845571734}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9880434405824321, "res": {"Yes": 0.9880434405824321, "No": 0.011954266918826159}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7758105695527899, "res": {"Yes": 0.7758105695527899, "No": 0.2241843218709473}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8830823474555011, "res": {"Yes": 0.8830823474555011, "No": 0.11691307137867608}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9611892645323258, "res": {"Yes": 0.9611892645323258, "No": 0.0388096248488805}, "ground_truth": 1}, {"key": "30501550", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.716762969148556, "res": {"Yes": 0.716762969148556, "No": 0.2832299973290284}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9589129863004321, "res": {"Yes": 0.9589129863004321, "No": 0.041086223841731905}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9975854088263395, "res": {"Yes": 0.9975854088263395, "No": 0.002413680060728044}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.995954973747732, "res": {"Yes": 0.995954973747732, "No": 0.0040445782436569246}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9809029077959104, "res": {"Yes": 0.9809029077959104, "No": 0.019096202226672115}, "ground_truth": 1}, {"key": "38755897", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990715786000898, "res": {"Yes": 0.9990715786000898, "No": 0.0009278068338721116}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9885351372241727, "res": {"Yes": 0.9885351372241727, "No": 0.01146422456426206}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9921520274118579, "res": {"Yes": 0.9921520274118579, "No": 0.007846764482395824}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.986826140014034, "res": {"Yes": 0.986826140014034, "No": 0.013171674846186069}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980963749968089, "res": {"Yes": 0.9980963749968089, "No": 0.0019028212989324219}, "ground_truth": 1}, {"key": "35507201", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989189478583407, "res": {"Yes": 0.9989189478583407, "No": 0.0010807427961946768}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999218909450165, "res": {"Yes": 0.999218909450165, "No": 0.0007803820113749611}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9987256971143401, "res": {"Yes": 0.9987256971143401, "No": 0.0012740977473638087}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992329535606399, "res": {"Yes": 0.9992329535606399, "No": 0.0007665175221238428}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9693869292519125, "res": {"Yes": 0.9693869292519125, "No": 0.030611852757689073}, "ground_truth": 1}, {"key": "36453511", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9925320199766379, "res": {"Yes": 0.9925320199766379, "No": 0.0074663688182338905}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9929542792979972, "res": {"Yes": 0.9929542792979972, "No": 0.007044532464448363}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.02499901137239662, "res": {"No": 0.9749996509347452, "Yes": 0.02499901137239662}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5572462144554376, "res": {"Yes": 0.5572462144554376, "No": 0.4427409247448344}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8095836223211157, "res": {"Yes": 0.8095836223211157, "No": 0.1904126347205697}, "ground_truth": 1}, {"key": "38066835", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8048234116801027, "res": {"Yes": 0.8048234116801027, "No": 0.19516555121672224}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9977073763852096, "res": {"Yes": 0.9977073763852096, "No": 0.0022920710075570497}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7134680373894878, "res": {"Yes": 0.7134680373894878, "No": 0.28653055479922984}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9790299886504381, "res": {"Yes": 0.9790299886504381, "No": 0.020968195275076207}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9985816072711717, "res": {"Yes": 0.9985816072711717, "No": 0.0014167043288453392}, "ground_truth": 1}, {"key": "39697181", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9977107029466896, "res": {"Yes": 0.9977107029466896, "No": 0.0022879638623883617}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996685228307005, "res": {"Yes": 0.9996685228307005, "No": 0.00033093899655853813}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.32347598588217685, "res": {"No": 0.6765236517811276, "Yes": 0.32347598588217685}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.38367965742877447, "res": {"No": 0.6163145084976627, "Yes": 0.38367965742877447}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1716651675058971, "res": {"No": 0.8283317256388939, "Yes": 0.1716651675058971}, "ground_truth": 1}, {"key": "21820893", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.36365800489066724, "res": {"No": 0.6363337112674018, "Yes": 0.36365800489066724}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.917479360201162, "res": {"Yes": 0.917479360201162, "No": 0.08251914103556077}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 1.652718429039141e-05, "res": {"No": 0.999983237218497, "Yes": 1.652718429039141e-05}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998582098131789, "res": {"Yes": 0.9998582098131789, "No": 0.00013677148739152294}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.31642788970236935, "res": {"No": 0.6834496640047686, "Yes": 0.31642788970236935}, "ground_truth": 1}, {"key": "40519933", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.2664880704947793, "res": {"No": 0.7334907149750082, "Yes": 0.2664880704947793}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.958894452609343, "res": {"Yes": 0.958894452609343, "No": 0.04110204508330455}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.006006443315742758, "res": {"No": 0.9939901474468393, "Yes": 0.006006443315742758}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9925512817361846, "res": {"Yes": 0.9925512817361846, "No": 0.007445577850063703}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996078921243943, "res": {"Yes": 0.9996078921243943, "No": 0.00039130666340579065}, "ground_truth": 1}, {"key": "30446033", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9968479325285663, "res": {"Yes": 0.9968479325285663, "No": 0.0031487781193996664}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.998172975245398, "res": {"Yes": 0.998172975245398, "No": 0.0018261049921922204}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 2.1461521863158657e-06, "res": {"No": 0.9999976607241361, "Yes": 2.1461521863158657e-06}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999033145265532, "res": {"Yes": 0.999033145265532, "No": 0.0009665636551249246}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9972627139181994, "res": {"Yes": 0.9972627139181994, "No": 0.002737262351076713}, "ground_truth": 1}, {"key": "40216291", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9984137970517977, "res": {"Yes": 0.9984137970517977, "No": 0.0015856534267225707}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9960221397300131, "res": {"Yes": 0.9960221397300131, "No": 0.003977464989213987}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8965327729964954, "res": {"Yes": 0.8965327729964954, "No": 0.10346575402652612}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994274736258069, "res": {"Yes": 0.9994274736258069, "No": 0.0005722409008003998}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9976742760964394, "res": {"Yes": 0.9976742760964394, "No": 0.002325302362526228}, "ground_truth": 1}, {"key": "33479118", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.99003620085682, "res": {"Yes": 0.99003620085682, "No": 0.009963626173497801}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9911782965925463, "res": {"Yes": 0.9911782965925463, "No": 0.008820554874510627}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9463066539015145, "res": {"Yes": 0.9463066539015145, "No": 0.05369147727638702}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8199225454118346, "res": {"Yes": 0.8199225454118346, "No": 0.18007185739574552}, "ground_truth": 1}, {"key": "22297373", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9732992394147096, "res": {"Yes": 0.9732992394147096, "No": 0.026698593309534484}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8068266836586491, "res": {"Yes": 0.8068266836586491, "No": 0.19316917879047493}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9140306263936847, "res": {"Yes": 0.9140306263936847, "No": 0.08596646505469116}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8650293603717457, "res": {"Yes": 0.8650293603717457, "No": 0.1349673070326698}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9894109944604166, "res": {"Yes": 0.9894109944604166, "No": 0.010587523493730534}, "ground_truth": 1}, {"key": "36463668", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9891395096332517, "res": {"Yes": 0.9891395096332517, "No": 0.010859956174301563}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9818565389325576, "res": {"Yes": 0.9818565389325576, "No": 0.018141805641974124}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9998559452768782, "res": {"Yes": 0.9998559452768782, "No": 0.00014389610670447871}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999406831293152, "res": {"Yes": 0.9999406831293152, "No": 5.918277625763698e-05}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999895549275502, "res": {"Yes": 0.9999895549275502, "No": 1.01571466174234e-05}, "ground_truth": 1}, {"key": "35264615", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999023025627055, "res": {"Yes": 0.9999023025627055, "No": 9.7454982941836e-05}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999462853826817, "res": {"Yes": 0.9999462853826817, "No": 5.3485605304197716e-05}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7544711792346281, "res": {"Yes": 0.7544711792346281, "No": 0.245527505334733}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9970027921226475, "res": {"Yes": 0.9970027921226475, "No": 0.002996809668514868}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980320271030162, "res": {"Yes": 0.9980320271030162, "No": 0.001967114954003346}, "ground_truth": 1}, {"key": "39898482", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9968616798541418, "res": {"Yes": 0.9968616798541418, "No": 0.0031380772731699367}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988216592892679, "res": {"Yes": 0.9988216592892679, "No": 0.0011780968282200132}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9997697881628126, "res": {"Yes": 0.9997697881628126, "No": 0.00022978074185490174}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9777101959687832, "res": {"Yes": 0.9777101959687832, "No": 0.022288821594165877}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9910252466928663, "res": {"Yes": 0.9910252466928663, "No": 0.008972239217561536}, "ground_truth": 1}, {"key": "37228721", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996507711745873, "res": {"Yes": 0.9996507711745873, "No": 0.0003487532171738475}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9987216529825628, "res": {"Yes": 0.9987216529825628, "No": 0.0012778355614081996}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.07294135622990948, "res": {"No": 0.9270526397214108, "Yes": 0.07294135622990948}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9689993915567293, "res": {"Yes": 0.9689993915567293, "No": 0.03099683117137702}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9845504016875796, "res": {"Yes": 0.9845504016875796, "No": 0.015447478389412747}, "ground_truth": 1}, {"key": "24535799", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.969164175191859, "res": {"Yes": 0.969164175191859, "No": 0.03083367938184111}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9945224537643016, "res": {"Yes": 0.9945224537643016, "No": 0.00547599272544513}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9925955639105764, "res": {"Yes": 0.9925955639105764, "No": 0.007403880680103103}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993741353350463, "res": {"Yes": 0.9993741353350463, "No": 0.0006255226610603271}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998828744557322, "res": {"Yes": 0.9998828744557322, "No": 0.00011693843011638443}, "ground_truth": 1}, {"key": "35177759", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9286959510627283, "res": {"Yes": 0.9286959510627283, "No": 0.07130286286383637}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9983649564425305, "res": {"Yes": 0.9983649564425305, "No": 0.001634790364965376}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9340234294534367, "res": {"Yes": 0.9340234294534367, "No": 0.06597544180918594}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997238055187202, "res": {"Yes": 0.9997238055187202, "No": 0.0002758636047735926}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.983836007365963, "res": {"Yes": 0.983836007365963, "No": 0.01616208357667988}, "ground_truth": 1}, {"key": "34364829", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978922918428978, "res": {"Yes": 0.9978922918428978, "No": 0.002106170309145319}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9991321475020006, "res": {"Yes": 0.9991321475020006, "No": 0.0008658074657878346}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.978441774275799, "res": {"Yes": 0.978441774275799, "No": 0.02155738564073634}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999852131313652, "res": {"Yes": 0.999852131313652, "No": 0.00014736574500896966}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999048055962748, "res": {"Yes": 0.9999048055962748, "No": 9.442006069755147e-05}, "ground_truth": 1}, {"key": "38090732", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999884821053314, "res": {"Yes": 0.9999884821053314, "No": 1.0952322759956289e-05}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996055089920477, "res": {"Yes": 0.9996055089920477, "No": 0.0003936684107851171}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0008898007470695714, "res": {"No": 0.9991083497565357, "Yes": 0.0008898007470695714}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9944752973127794, "res": {"Yes": 0.9944752973127794, "No": 0.00552428362841661}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7826680494068566, "res": {"Yes": 0.7826680494068566, "No": 0.21732994420368662}, "ground_truth": 1}, {"key": "30651479", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9639756278543113, "res": {"Yes": 0.9639756278543113, "No": 0.036022494083563686}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984908043828212, "res": {"Yes": 0.9984908043828212, "No": 0.0015084550464121679}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.793111628432477, "res": {"Yes": 0.793111628432477, "No": 0.20688686107352258}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999690683948077, "res": {"Yes": 0.999690683948077, "No": 0.00030858908131883004}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996277878481368, "res": {"Yes": 0.9996277878481368, "No": 0.00037162421090941204}, "ground_truth": 1}, {"key": "39380921", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9957554065591746, "res": {"Yes": 0.9957554065591746, "No": 0.004243914094799258}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997571555714829, "res": {"Yes": 0.9997571555714829, "No": 0.00024170151552534543}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9968426033937637, "res": {"Yes": 0.9968426033937637, "No": 0.003156591098398839}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9955077203095217, "res": {"Yes": 0.9955077203095217, "No": 0.004491776493100546}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988379528003616, "res": {"Yes": 0.9988379528003616, "No": 0.0011611441775968025}, "ground_truth": 1}, {"key": "39037490", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9972735063536872, "res": {"Yes": 0.9972735063536872, "No": 0.002725652581739897}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.998700491293656, "res": {"Yes": 0.998700491293656, "No": 0.0012983868106132292}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8346915446365358, "res": {"Yes": 0.8346915446365358, "No": 0.16530683928933165}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.3521242791253674, "res": {"No": 0.647873109809477, "Yes": 0.3521242791253674}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.974517690292707, "res": {"Yes": 0.974517690292707, "No": 0.025481703351060297}, "ground_truth": 1}, {"key": "35917499", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7993489700951311, "res": {"Yes": 0.7993489700951311, "No": 0.20064598348251816}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9529843636168007, "res": {"Yes": 0.9529843636168007, "No": 0.04701443484798113}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3359903969275947, "res": {"No": 0.664009116454369, "Yes": 0.3359903969275947}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9977499819938991, "res": {"Yes": 0.9977499819938991, "No": 0.00224958460457298}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.994749949541406, "res": {"Yes": 0.994749949541406, "No": 0.0052490823926877985}, "ground_truth": 1}, {"key": "34908073", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9118525496449444, "res": {"Yes": 0.9118525496449444, "No": 0.08814640092116287}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9987939471670075, "res": {"Yes": 0.9987939471670075, "No": 0.0012058125788614452}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.013431279516190877, "res": {"No": 0.986567914496596, "Yes": 0.013431279516190877}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9983913364884552, "res": {"Yes": 0.9983913364884552, "No": 0.0016084755691377697}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992886556254563, "res": {"Yes": 0.9992886556254563, "No": 0.0007111896690164039}, "ground_truth": 1}, {"key": "36344759", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997033120205857, "res": {"Yes": 0.9997033120205857, "No": 0.00029657275209372274}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9915999819738045, "res": {"Yes": 0.9915999819738045, "No": 0.00839936055865574}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9953343262297011, "res": {"Yes": 0.9953343262297011, "No": 0.004664978749493804}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7209881480810855, "res": {"Yes": 0.7209881480810855, "No": 0.27900998758661777}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999738203326934, "res": {"Yes": 0.9999738203326934, "No": 2.6041399443449644e-05}, "ground_truth": 1}, {"key": "39984637", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998922397231315, "res": {"Yes": 0.998922397231315, "No": 0.0010765740024020621}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997127227020275, "res": {"Yes": 0.9997127227020275, "No": 0.00028657192677563324}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.26950067068745104, "res": {"No": 0.7304941909347027, "Yes": 0.26950067068745104}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7744950270484434, "res": {"Yes": 0.7744950270484434, "No": 0.22550097417098983}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9407127343460726, "res": {"Yes": 0.9407127343460726, "No": 0.059284285980034455}, "ground_truth": 1}, {"key": "17917326", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9871102851995763, "res": {"Yes": 0.9871102851995763, "No": 0.01288789603430834}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9476967953635429, "res": {"Yes": 0.9476967953635429, "No": 0.05229844189696858}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9411546306688687, "res": {"Yes": 0.9411546306688687, "No": 0.058842929319280195}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994015134345732, "res": {"Yes": 0.9994015134345732, "No": 0.0005981890600799087}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9850916041471866, "res": {"Yes": 0.9850916041471866, "No": 0.014906782026875771}, "ground_truth": 1}, {"key": "32193638", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9938900471433613, "res": {"Yes": 0.9938900471433613, "No": 0.006107962690164037}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9839182801565536, "res": {"Yes": 0.9839182801565536, "No": 0.016069985524676263}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9861638359123474, "res": {"Yes": 0.9861638359123474, "No": 0.013834266290513876}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8722750417107884, "res": {"Yes": 0.8722750417107884, "No": 0.12771558238663375}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.11163730619435719, "res": {"No": 0.888351127761238, "Yes": 0.11163730619435719}, "ground_truth": 1}, {"key": "34564692", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9918589790682769, "res": {"Yes": 0.9918589790682769, "No": 0.008139713468640111}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.12845036678002475, "res": {"No": 0.8715262970569685, "Yes": 0.12845036678002475}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9830822037007403, "res": {"Yes": 0.9830822037007403, "No": 0.016907955976318872}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993729440817869, "res": {"Yes": 0.9993729440817869, "No": 0.0006262956587745753}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991311947300391, "res": {"Yes": 0.9991311947300391, "No": 0.0008680687859131816}, "ground_truth": 1}, {"key": "39329284", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9977563899639607, "res": {"Yes": 0.9977563899639607, "No": 0.002240820915765989}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.13224751481358363, "res": {"No": 0.8677309480986197, "Yes": 0.13224751481358363}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9922337123687462, "res": {"Yes": 0.9922337123687462, "No": 0.00776575419191611}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9956518781734824, "res": {"Yes": 0.9956518781734824, "No": 0.004347866560724016}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9849657736275531, "res": {"Yes": 0.9849657736275531, "No": 0.015032506840548954}, "ground_truth": 1}, {"key": "37438541", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9949857000856851, "res": {"Yes": 0.9949857000856851, "No": 0.005013414796292993}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999414491636959, "res": {"Yes": 0.999414491636959, "No": 0.0005850310121004442}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.10764749772332309, "res": {"No": 0.8923513087929583, "Yes": 0.10764749772332309}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999118462083051, "res": {"Yes": 0.999118462083051, "No": 0.0008803561644891872}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9930243277424065, "res": {"Yes": 0.9930243277424065, "No": 0.006973372582526368}, "ground_truth": 1}, {"key": "34652757", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.994405266839264, "res": {"Yes": 0.994405266839264, "No": 0.005593891948471609}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.944855136451079, "res": {"Yes": 0.944855136451079, "No": 0.055142115949128656}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.998726173306866, "res": {"Yes": 0.998726173306866, "No": 0.001272728828211268}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996655437429679, "res": {"Yes": 0.9996655437429679, "No": 0.0003337067315333525}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990041284095803, "res": {"Yes": 0.9990041284095803, "No": 0.0009943866927973135}, "ground_truth": 1}, {"key": "31361004", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999486418058378, "res": {"Yes": 0.999486418058378, "No": 0.0005131912372991479}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9969653398180233, "res": {"Yes": 0.9969653398180233, "No": 0.0030335825444232955}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.1669115245615358, "res": {"No": 0.8330865505432252, "Yes": 0.1669115245615358}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9623049198865928, "res": {"Yes": 0.9623049198865928, "No": 0.03769243001682239}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998900258575993, "res": {"Yes": 0.9998900258575993, "No": 0.00010953931851091673}, "ground_truth": 1}, {"key": "26150727", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9791326110567883, "res": {"Yes": 0.9791326110567883, "No": 0.020863396898032335}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9978456362799178, "res": {"Yes": 0.9978456362799178, "No": 0.002153336024691035}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9922257311705334, "res": {"Yes": 0.9922257311705334, "No": 0.007773692517577106}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8506360629403706, "res": {"Yes": 0.8506360629403706, "No": 0.14936069896889684}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9965140010521932, "res": {"Yes": 0.9965140010521932, "No": 0.003485488752441472}, "ground_truth": 1}, {"key": "36997402", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9889213344681841, "res": {"Yes": 0.9889213344681841, "No": 0.011077159426286468}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9813992466053534, "res": {"Yes": 0.9813992466053534, "No": 0.018599882788060778}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0006106823007873602, "res": {"No": 0.9993885427762071, "Yes": 0.0006106823007873602}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9780406630997966, "res": {"Yes": 0.9780406630997966, "No": 0.021956799834202127}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9964528016255259, "res": {"Yes": 0.9964528016255259, "No": 0.0035446742968112707}, "ground_truth": 1}, {"key": "37430643", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7457505112768887, "res": {"Yes": 0.7457505112768887, "No": 0.2542355447865305}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6617715984661946, "res": {"Yes": 0.6617715984661946, "No": 0.33821009289006954}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3125755121861502, "res": {"No": 0.6874160403680926, "Yes": 0.3125755121861502}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9921360667905725, "res": {"Yes": 0.9921360667905725, "No": 0.007862038932582562}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.986006084998965, "res": {"Yes": 0.986006084998965, "No": 0.013992053747094807}, "ground_truth": 1}, {"key": "36964631", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.997120109663127, "res": {"Yes": 0.997120109663127, "No": 0.0028787831254756583}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9613298218249979, "res": {"Yes": 0.9613298218249979, "No": 0.03866839033144733}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.2060295034122108, "res": {"No": 0.7939695647649205, "Yes": 0.2060295034122108}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9101345711680682, "res": {"Yes": 0.9101345711680682, "No": 0.0898639067789871}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9479544655508984, "res": {"Yes": 0.9479544655508984, "No": 0.05204454460900767}, "ground_truth": 1}, {"key": "35502013", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9764555572401432, "res": {"Yes": 0.9764555572401432, "No": 0.023543968640612815}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9007425142166623, "res": {"Yes": 0.9007425142166623, "No": 0.09925565338292774}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.41091189288892804, "res": {"No": 0.5890848193563433, "Yes": 0.41091189288892804}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9902718218648676, "res": {"Yes": 0.9902718218648676, "No": 0.009727192159705507}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9857062388213438, "res": {"Yes": 0.9857062388213438, "No": 0.014288849516121811}, "ground_truth": 1}, {"key": "33987664", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9089614908531638, "res": {"Yes": 0.9089614908531638, "No": 0.09103594959342352}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9397935344927941, "res": {"Yes": 0.9397935344927941, "No": 0.06019942970807647}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9967848077364058, "res": {"Yes": 0.9967848077364058, "No": 0.0032148209979389088}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997507311526429, "res": {"Yes": 0.9997507311526429, "No": 0.0002489959317466268}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995784717679996, "res": {"Yes": 0.9995784717679996, "No": 0.00042135620052516235}, "ground_truth": 1}, {"key": "35203721", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9968607330353679, "res": {"Yes": 0.9968607330353679, "No": 0.0031387689816244147}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984275736597823, "res": {"Yes": 0.9984275736597823, "No": 0.0015719317530623743}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9953556996713013, "res": {"Yes": 0.9953556996713013, "No": 0.004644058585109839}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9728732349170034, "res": {"Yes": 0.9728732349170034, "No": 0.027124744134377828}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9968065976904662, "res": {"Yes": 0.9968065976904662, "No": 0.0031930506581434805}, "ground_truth": 1}, {"key": "39028348", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9981024391493765, "res": {"Yes": 0.9981024391493765, "No": 0.001897418501648035}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.996959891417329, "res": {"Yes": 0.996959891417329, "No": 0.0030391390831618448}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.06782728712721038, "res": {"No": 0.932171358635552, "Yes": 0.06782728712721038}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8261604458117439, "res": {"Yes": 0.8261604458117439, "No": 0.1738384776956895}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3808852348872107, "res": {"No": 0.6191133284111676, "Yes": 0.3808852348872107}, "ground_truth": 1}, {"key": "37459383", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5314701205477728, "res": {"Yes": 0.5314701205477728, "No": 0.46852899041367985}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8430931659042102, "res": {"Yes": 0.8430931659042102, "No": 0.15690596533264825}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9976755803568731, "res": {"Yes": 0.9976755803568731, "No": 0.0023241971765066145}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9940786146180275, "res": {"Yes": 0.9940786146180275, "No": 0.0059210273872491595}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9919611433247147, "res": {"Yes": 0.9919611433247147, "No": 0.008038134098711893}, "ground_truth": 1}, {"key": "34020070", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992903233097066, "res": {"Yes": 0.9992903233097066, "No": 0.0007088100357387544}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995209443438209, "res": {"Yes": 0.9995209443438209, "No": 0.00047823371569444555}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8106521109240471, "res": {"Yes": 0.8106521109240471, "No": 0.18934695615397654}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9883596156586572, "res": {"Yes": 0.9883596156586572, "No": 0.01163989333943044}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9893103012912052, "res": {"Yes": 0.9893103012912052, "No": 0.01068931109387289}, "ground_truth": 1}, {"key": "35176615", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9849225129108994, "res": {"Yes": 0.9849225129108994, "No": 0.015077148888904752}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8278266967052382, "res": {"Yes": 0.8278266967052382, "No": 0.17217153545226574}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9840158119540457, "res": {"Yes": 0.9840158119540457, "No": 0.01598201102806113}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.43026494881857114, "res": {"No": 0.5697301792301774, "Yes": 0.43026494881857114}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9482265295982154, "res": {"Yes": 0.9482265295982154, "No": 0.05176817503966416}, "ground_truth": 1}, {"key": "33296389", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3882708173402107, "res": {"No": 0.6116938541180288, "Yes": 0.3882708173402107}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5419036071206214, "res": {"Yes": 0.5419036071206214, "No": 0.4580936361599758}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9998775182714994, "res": {"Yes": 0.9998775182714994, "No": 0.00012230330401229053}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9966019540702501, "res": {"Yes": 0.9966019540702501, "No": 0.003397834371015448}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995557247195026, "res": {"Yes": 0.9995557247195026, "No": 0.000444001463218641}, "ground_truth": 1}, {"key": "35399504", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996746002139981, "res": {"Yes": 0.9996746002139981, "No": 0.0003252355073688265}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996968769710715, "res": {"Yes": 0.9996968769710715, "No": 0.0003028357435316941}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9939985128037222, "res": {"Yes": 0.9939985128037222, "No": 0.006000860520226517}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989477386156908, "res": {"Yes": 0.9989477386156908, "No": 0.0010522116465164694}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999852131313652, "res": {"Yes": 0.999852131313652, "No": 0.00014768092849805199}, "ground_truth": 1}, {"key": "34807886", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999137450601713, "res": {"Yes": 0.9999137450601713, "No": 8.611861222769542e-05}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994974910999104, "res": {"Yes": 0.9994974910999104, "No": 0.0005023941434620228}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.01746176928648222, "res": {"No": 0.982537461708713, "Yes": 0.01746176928648222}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.986224714671136, "res": {"Yes": 0.986224714671136, "No": 0.013774713812789947}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998896682929905, "res": {"Yes": 0.9998896682929905, "No": 0.00011005261371763576}, "ground_truth": 1}, {"key": "37629813", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996865131172844, "res": {"Yes": 0.9996865131172844, "No": 0.00031323683255867537}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9986864583520334, "res": {"Yes": 0.9986864583520334, "No": 0.0013134027374008543}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.027990687875431543, "res": {"No": 0.9720089293401052, "Yes": 0.027990687875431543}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998735850310456, "res": {"Yes": 0.9998735850310456, "No": 0.00012564036225755885}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999920581810364, "res": {"Yes": 0.9999920581810364, "No": 7.737027407573793e-06}, "ground_truth": 1}, {"key": "28084389", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999962302846054, "res": {"Yes": 0.9999962302846054, "No": 3.4793119473676298e-06}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999551060207649, "res": {"Yes": 0.9999551060207649, "No": 4.479715164129377e-05}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.37797324737778515, "res": {"No": 0.622025413102258, "Yes": 0.37797324737778515}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.001627552868375903, "res": {"No": 0.9983719669858687, "Yes": 0.001627552868375903}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8307045357482812, "res": {"Yes": 0.8307045357482812, "No": 0.1692946654144752}, "ground_truth": 1}, {"key": "35391734", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.24671417466593396, "res": {"No": 0.7532832951177858, "Yes": 0.24671417466593396}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9814522907052847, "res": {"Yes": 0.9814522907052847, "No": 0.01854633098607317}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.43302842780733375, "res": {"No": 0.5669708655977747, "Yes": 0.43302842780733375}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9843960490843071, "res": {"Yes": 0.9843960490843071, "No": 0.015602871674014506}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9841346006561298, "res": {"Yes": 0.9841346006561298, "No": 0.015864815236444698}, "ground_truth": 1}, {"key": "40214591", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9933299521822124, "res": {"Yes": 0.9933299521822124, "No": 0.006669582598155051}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9896847360532804, "res": {"Yes": 0.9896847360532804, "No": 0.010314465000188466}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.31980674100165934, "res": {"No": 0.6801891212464257, "Yes": 0.31980674100165934}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9706214330365386, "res": {"Yes": 0.9706214330365386, "No": 0.02937694194314763}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987909744610064, "res": {"Yes": 0.9987909744610064, "No": 0.0012078669817233282}, "ground_truth": 1}, {"key": "26283171", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.995565261621808, "res": {"Yes": 0.995565261621808, "No": 0.00443185077502092}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9191413913303648, "res": {"Yes": 0.9191413913303648, "No": 0.08085687197276738}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9995367872561645, "res": {"Yes": 0.9995367872561645, "No": 0.00046250462549108447}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992748452518809, "res": {"Yes": 0.9992748452518809, "No": 0.0007248442889781796}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9978800620492791, "res": {"Yes": 0.9978800620492791, "No": 0.0021194259611633697}, "ground_truth": 1}, {"key": "37084030", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999508329509569, "res": {"Yes": 0.999508329509569, "No": 0.0004914922433935277}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984301918398415, "res": {"Yes": 0.9984301918398415, "No": 0.0015695144107164734}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.76238568732632, "res": {"Yes": 0.76238568732632, "No": 0.23761019123744773}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7364977264865256, "res": {"Yes": 0.7364977264865256, "No": 0.2635014521526911}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9251883320292886, "res": {"Yes": 0.9251883320292886, "No": 0.07480975410725228}, "ground_truth": 1}, {"key": "39027295", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.49127774943231173, "res": {"No": 0.5087205657086473, "Yes": 0.49127774943231173}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8272371960728374, "res": {"Yes": 0.8272371960728374, "No": 0.17275725847424647}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9981668099492395, "res": {"Yes": 0.9981668099492395, "No": 0.0018331147679511164}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998016050428828, "res": {"Yes": 0.9998016050428828, "No": 0.0001981349883933189}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995383361995424, "res": {"Yes": 0.9995383361995424, "No": 0.0004614463786712127}, "ground_truth": 1}, {"key": "14018647", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997603732950662, "res": {"Yes": 0.9997603732950662, "No": 0.00023953620103229977}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999206582977194, "res": {"Yes": 0.9999206582977194, "No": 7.896743544783722e-05}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6251425220261371, "res": {"Yes": 0.6251425220261371, "No": 0.37485645985810606}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6258249372171376, "res": {"Yes": 0.6258249372171376, "No": 0.3741678595245623}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.11336734410674963, "res": {"No": 0.8866323408065105, "Yes": 0.11336734410674963}, "ground_truth": 1}, {"key": "37424289", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9861347464805578, "res": {"Yes": 0.9861347464805578, "No": 0.013864710223341282}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.10204377409149135, "res": {"No": 0.897953979289859, "Yes": 0.10204377409149135}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9769576449778657, "res": {"Yes": 0.9769576449778657, "No": 0.0230421069466099}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998939591587275, "res": {"Yes": 0.9998939591587275, "No": 0.00010584603709076823}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994621243070224, "res": {"Yes": 0.9994621243070224, "No": 0.0005376692305401375}, "ground_truth": 1}, {"key": "37498031", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993579449056404, "res": {"Yes": 0.9993579449056404, "No": 0.0006418084906135326}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999782301739706, "res": {"Yes": 0.999782301739706, "No": 0.00021751668450713368}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9920064239124857, "res": {"Yes": 0.9920064239124857, "No": 0.007993307099663075}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.978991256053191, "res": {"Yes": 0.978991256053191, "No": 0.02100771768424397}, "ground_truth": 1}, {"key": "30104095", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9979489133589139, "res": {"Yes": 0.9979489133589139, "No": 0.0020510399946682177}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9920849105974554, "res": {"Yes": 0.9920849105974554, "No": 0.007913838841094535}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.993631989569215, "res": {"Yes": 0.993631989569215, "No": 0.006367018323916499}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8857742125167051, "res": {"Yes": 0.8857742125167051, "No": 0.11422256606626606}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9104134336065185, "res": {"Yes": 0.9104134336065185, "No": 0.08958503437648334}, "ground_truth": 1}, {"key": "37911407", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9390678355978525, "res": {"Yes": 0.9390678355978525, "No": 0.060929367228281024}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9775217565794759, "res": {"Yes": 0.9775217565794759, "No": 0.022476364242987996}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9275494783439443, "res": {"Yes": 0.9275494783439443, "No": 0.07244953706158809}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9774798325479043, "res": {"Yes": 0.9774798325479043, "No": 0.02251976975018085}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9841302104414686, "res": {"Yes": 0.9841302104414686, "No": 0.015869286571359824}, "ground_truth": 1}, {"key": "39177472", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9909615545560367, "res": {"Yes": 0.9909615545560367, "No": 0.00903812985885408}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9938011451702303, "res": {"Yes": 0.9938011451702303, "No": 0.006198154453708024}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5704964113837306, "res": {"Yes": 0.5704964113837306, "No": 0.42950291526598045}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9977689716515892, "res": {"Yes": 0.9977689716515892, "No": 0.002230282544425439}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9967328076268279, "res": {"Yes": 0.9967328076268279, "No": 0.003266411164440056}, "ground_truth": 1}, {"key": "32325454", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9823942014888007, "res": {"Yes": 0.9823942014888007, "No": 0.01760528742818033}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9560868813374348, "res": {"Yes": 0.9560868813374348, "No": 0.04390996462649196}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9974156753315095, "res": {"Yes": 0.9974156753315095, "No": 0.002584283462418291}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9974945465009809, "res": {"Yes": 0.9974945465009809, "No": 0.0025050582280122364}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9929927040953086, "res": {"Yes": 0.9929927040953086, "No": 0.007006345784106017}, "ground_truth": 1}, {"key": "38395319", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9958639351747895, "res": {"Yes": 0.9958639351747895, "No": 0.00413550429609326}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9926030818578478, "res": {"Yes": 0.9926030818578478, "No": 0.007396058912756519}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.99713077790825, "res": {"Yes": 0.99713077790825, "No": 0.0028688586822295118}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9938070354470736, "res": {"Yes": 0.9938070354470736, "No": 0.00619173834829404}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998392169546534, "res": {"Yes": 0.998392169546534, "No": 0.0016070350204899911}, "ground_truth": 1}, {"key": "38235895", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998384686525427, "res": {"Yes": 0.998384686525427, "No": 0.0016144582943967932}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9007247157204311, "res": {"Yes": 0.9007247157204311, "No": 0.09926807104187432}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.08468853894484149, "res": {"No": 0.9153107260895588, "Yes": 0.08468853894484149}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9771929960404048, "res": {"Yes": 0.9771929960404048, "No": 0.022806447452338847}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9841822782117189, "res": {"Yes": 0.9841822782117189, "No": 0.015817485083206642}, "ground_truth": 1}, {"key": "26543267", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9975820828821309, "res": {"Yes": 0.9975820828821309, "No": 0.002417781971007434}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9720129845698176, "res": {"Yes": 0.9720129845698176, "No": 0.027986108973459514}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0064023574812357735, "res": {"No": 0.9935944436085202, "Yes": 0.0064023574812357735}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6178004191759939, "res": {"Yes": 0.6178004191759939, "No": 0.38219587882687256}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4449110519738671, "res": {"No": 0.5550647918374866, "Yes": 0.4449110519738671}, "ground_truth": 1}, {"key": "39054728", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8560131934930524, "res": {"Yes": 0.8560131934930524, "No": 0.14398212774366415}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.1615400951419166, "res": {"No": 0.8384495135222437, "Yes": 0.1615400951419166}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9897702108972917, "res": {"Yes": 0.9897702108972917, "No": 0.010225521253655574}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6391536242260505, "res": {"Yes": 0.6391536242260505, "No": 0.360840588961255}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9864738270416594, "res": {"Yes": 0.9864738270416594, "No": 0.01352479921271615}, "ground_truth": 1}, {"key": "39158443", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.11391337361652612, "res": {"No": 0.8860763218891463, "Yes": 0.11391337361652612}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.015436043765857263, "res": {"No": 0.9845610339047759, "Yes": 0.015436043765857263}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3501379707615798, "res": {"No": 0.6498609123432771, "Yes": 0.3501379707615798}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8014051776858924, "res": {"Yes": 0.8014051776858924, "No": 0.19859186300259168}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7849434986752601, "res": {"Yes": 0.7849434986752601, "No": 0.21505544508168561}, "ground_truth": 1}, {"key": "36254201", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9752842880476248, "res": {"Yes": 0.9752842880476248, "No": 0.024715161444424035}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9833751498002102, "res": {"Yes": 0.9833751498002102, "No": 0.01662444627104038}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 5.020580934229912e-07, "res": {"No": 0.9999992103693117, "Yes": 5.020580934229912e-07}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9906985803310404, "res": {"Yes": 0.9906985803310404, "No": 0.009301240505779983}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9917833368358813, "res": {"Yes": 0.9917833368358813, "No": 0.008216392786408675}, "ground_truth": 1}, {"key": "23434347", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9932665505508281, "res": {"Yes": 0.9932665505508281, "No": 0.006733061737981131}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9757348856728798, "res": {"Yes": 0.9757348856728798, "No": 0.02426452189018242}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9993513965841927, "res": {"Yes": 0.9993513965841927, "No": 0.0006482163784427934}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999856064459714, "res": {"Yes": 0.999856064459714, "No": 0.00014343078121630633}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9977644591518421, "res": {"Yes": 0.9977644591518421, "No": 0.0022348025485210694}, "ground_truth": 1}, {"key": "34397620", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9957582443665515, "res": {"Yes": 0.9957582443665515, "No": 0.0042406250633593495}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9940452768619625, "res": {"Yes": 0.9940452768619625, "No": 0.0059516963453444885}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9915283588148976, "res": {"Yes": 0.9915283588148976, "No": 0.008470571492874123}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994631965605485, "res": {"Yes": 0.9994631965605485, "No": 0.0005364098733679083}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996589934259632, "res": {"Yes": 0.9996589934259632, "No": 0.00034085274731506703}, "ground_truth": 1}, {"key": "34340916", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997265427962388, "res": {"Yes": 0.9997265427962388, "No": 0.00027322306732289564}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9923348835918837, "res": {"Yes": 0.9923348835918837, "No": 0.007664710012921954}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9809573994468602, "res": {"Yes": 0.9809573994468602, "No": 0.01904176032211349}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5784379721291636, "res": {"Yes": 0.5784379721291636, "No": 0.42156046494569444}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993448447080114, "res": {"Yes": 0.9993448447080114, "No": 0.0006541790285551501}, "ground_truth": 1}, {"key": "30375089", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978146575453962, "res": {"Yes": 0.9978146575453962, "No": 0.00218474316929503}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9986462763116828, "res": {"Yes": 0.9986462763116828, "No": 0.0013508183297412867}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9875671060717849, "res": {"Yes": 0.9875671060717849, "No": 0.012430307937916133}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9674014207181574, "res": {"Yes": 0.9674014207181574, "No": 0.03259379650417936}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9975122196674199, "res": {"Yes": 0.9975122196674199, "No": 0.0024857687776851686}, "ground_truth": 1}, {"key": "35807797", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9977531858740102, "res": {"Yes": 0.9977531858740102, "No": 0.002245682039816087}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.026477935909196105, "res": {"No": 0.9735200583660231, "Yes": 0.026477935909196105}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9982608858146923, "res": {"Yes": 0.9982608858146923, "No": 0.0017388632219170806}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999298363015874, "res": {"Yes": 0.9999298363015874, "No": 7.001311334217462e-05}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999826412106655, "res": {"Yes": 0.9999826412106655, "No": 1.720903536765477e-05}, "ground_truth": 1}, {"key": "34188172", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999175592584247, "res": {"Yes": 0.9999175592584247, "No": 8.22639975351555e-05}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999889589149532, "res": {"Yes": 0.9999889589149532, "No": 1.0968171274381617e-05}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9941986601390026, "res": {"Yes": 0.9941986601390026, "No": 0.005801094339519213}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8115943521199872, "res": {"Yes": 0.8115943521199872, "No": 0.18840418569912867}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6823269412570724, "res": {"Yes": 0.6823269412570724, "No": 0.31767119789506015}, "ground_truth": 1}, {"key": "37075567", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8386732333097303, "res": {"Yes": 0.8386732333097303, "No": 0.16131159689502983}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8701752507288264, "res": {"Yes": 0.8701752507288264, "No": 0.12982145443052528}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9865608270181565, "res": {"Yes": 0.9865608270181565, "No": 0.013438201094243022}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997722908696604, "res": {"Yes": 0.9997722908696604, "No": 0.00022663517317285763}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997856387386591, "res": {"Yes": 0.9997856387386591, "No": 0.00021385186548399316}, "ground_truth": 1}, {"key": "35559735", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995969370916878, "res": {"Yes": 0.9995969370916878, "No": 0.0004022141096751521}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995992010113826, "res": {"Yes": 0.9995992010113826, "No": 0.00039981164870170696}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.08022584172400987, "res": {"No": 0.9197732874425298, "Yes": 0.08022584172400987}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9973547185394015, "res": {"Yes": 0.9973547185394015, "No": 0.0026450436790227566}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994258057126708, "res": {"Yes": 0.9994258057126708, "No": 0.0005739975671892176}, "ground_truth": 1}, {"key": "33005019", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9981164493122121, "res": {"Yes": 0.9981164493122121, "No": 0.0018833250890444512}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9987473391354451, "res": {"Yes": 0.9987473391354451, "No": 0.0012520914072295074}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.05638399146732098, "res": {"No": 0.9435884951786517, "Yes": 0.05638399146732098}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9935862003857729, "res": {"Yes": 0.9935862003857729, "No": 0.006413552175473717}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9327428802353044, "res": {"Yes": 0.9327428802353044, "No": 0.06725548516732115}, "ground_truth": 1}, {"key": "30808252", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.928320332384198, "res": {"Yes": 0.928320332384198, "No": 0.0716761802971886}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6462284499636405, "res": {"Yes": 0.6462284499636405, "No": 0.3537650806926768}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9856190382334328, "res": {"Yes": 0.9856190382334328, "No": 0.01438070358300307}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9540021346096815, "res": {"Yes": 0.9540021346096815, "No": 0.045996673514962935}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9915733717537458, "res": {"Yes": 0.9915733717537458, "No": 0.008425579683057436}, "ground_truth": 1}, {"key": "15159017", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9763284934877098, "res": {"Yes": 0.9763284934877098, "No": 0.02366832080221497}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9867372211168585, "res": {"Yes": 0.9867372211168585, "No": 0.013259208325049832}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9984797498527728, "res": {"Yes": 0.9984797498527728, "No": 0.0015201291205523462}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9983565177984001, "res": {"Yes": 0.9983565177984001, "No": 0.0016433681388374304}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992543757160417, "res": {"Yes": 0.9992543757160417, "No": 0.000745218048393852}, "ground_truth": 1}, {"key": "24493400", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999684963934286, "res": {"Yes": 0.999684963934286, "No": 0.0003147710527703323}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998888339594022, "res": {"Yes": 0.9998888339594022, "No": 0.00011108298759516829}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.033772230399276085, "res": {"No": 0.9662269639861393, "Yes": 0.033772230399276085}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.996138286268606, "res": {"Yes": 0.996138286268606, "No": 0.0038613407934631294}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9968446163200652, "res": {"Yes": 0.9968446163200652, "No": 0.0031547071759199085}, "ground_truth": 1}, {"key": "37791071", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7602388186480755, "res": {"Yes": 0.7602388186480755, "No": 0.23976058884498444}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.019669526874941765, "res": {"No": 0.9803287219505379, "Yes": 0.019669526874941765}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5753917533484385, "res": {"Yes": 0.5753917533484385, "No": 0.4246056598338538}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9959513081421968, "res": {"Yes": 0.9959513081421968, "No": 0.004047943518637787}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9983402396282507, "res": {"Yes": 0.9983402396282507, "No": 0.001659062492013744}, "ground_truth": 1}, {"key": "33528627", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9855470167537308, "res": {"Yes": 0.9855470167537308, "No": 0.014450810153632589}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9961049365155084, "res": {"Yes": 0.9961049365155084, "No": 0.003894139298784595}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9938501250715869, "res": {"Yes": 0.9938501250715869, "No": 0.006149589176279065}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9975157796951334, "res": {"Yes": 0.9975157796951334, "No": 0.0024838537337451795}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9983218267101748, "res": {"Yes": 0.9983218267101748, "No": 0.0016778903814131706}, "ground_truth": 1}, {"key": "39925662", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991607100310176, "res": {"Yes": 0.9991607100310176, "No": 0.0008389373722436034}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9027060992738611, "res": {"Yes": 0.9027060992738611, "No": 0.09729051271914518}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9929011477360596, "res": {"Yes": 0.9929011477360596, "No": 0.007098647542866615}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9915351562608614, "res": {"Yes": 0.9915351562608614, "No": 0.008463684331410109}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9977966221086763, "res": {"Yes": 0.9977966221086763, "No": 0.00220118373930847}, "ground_truth": 1}, {"key": "29213416", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9750923602589794, "res": {"Yes": 0.9750923602589794, "No": 0.024898311227506444}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9893130990646933, "res": {"Yes": 0.9893130990646933, "No": 0.010681761762700316}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9108756858815645, "res": {"Yes": 0.9108756858815645, "No": 0.08912322645222086}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9950187458010098, "res": {"Yes": 0.9950187458010098, "No": 0.004981019450300002}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9965211031331351, "res": {"Yes": 0.9965211031331351, "No": 0.0034782882096288576}, "ground_truth": 1}, {"key": "34492745", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978470634995521, "res": {"Yes": 0.9978470634995521, "No": 0.0021525093023983914}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9975555192210706, "res": {"Yes": 0.9975555192210706, "No": 0.002443167318753552}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6038336094755066, "res": {"Yes": 0.6038336094755066, "No": 0.3961654309653348}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9788260759841877, "res": {"Yes": 0.9788260759841877, "No": 0.021172946938587726}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6518918793659456, "res": {"Yes": 0.6518918793659456, "No": 0.3480750714203985}, "ground_truth": 1}, {"key": "34191937", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7051490571049979, "res": {"Yes": 0.7051490571049979, "No": 0.29484042535449045}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7656825046157225, "res": {"Yes": 0.7656825046157225, "No": 0.23429714939898408}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.00519837865047204, "res": {"No": 0.9948012627530539, "Yes": 0.00519837865047204}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.2518360999737788, "res": {"No": 0.7481358274445193, "Yes": 0.2518360999737788}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.02633084535069841, "res": {"No": 0.9736674117775449, "Yes": 0.02633084535069841}, "ground_truth": 1}, {"key": "34933372", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9369531893461833, "res": {"Yes": 0.9369531893461833, "No": 0.06304408723207887}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8899128343365322, "res": {"Yes": 0.8899128343365322, "No": 0.11008292869502366}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.011847433703027179, "res": {"No": 0.988151793884883, "Yes": 0.011847433703027179}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.0013951448973984477, "res": {"No": 0.998604548249524, "Yes": 0.0013951448973984477}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.024709462785275603, "res": {"No": 0.9752899573916692, "Yes": 0.024709462785275603}, "ground_truth": 1}, {"key": "38714379", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.03600583393159088, "res": {"No": 0.9639930200594837, "Yes": 0.03600583393159088}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.004753264185499632, "res": {"No": 0.9952459942280387, "Yes": 0.004753264185499632}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.05693824611172261, "res": {"No": 0.9430606428366436, "Yes": 0.05693824611172261}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.007396421328522356, "res": {"No": 0.9925988517895676, "Yes": 0.007396421328522356}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.164919187134979, "res": {"No": 0.8350754157051208, "Yes": 0.164919187134979}, "ground_truth": 1}, {"key": "39220660", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.22477308427585635, "res": {"No": 0.7752176425167631, "Yes": 0.22477308427585635}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0012349587626826965, "res": {"No": 0.9987631551239118, "Yes": 0.0012349587626826965}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.11355411176883518, "res": {"No": 0.886444580826596, "Yes": 0.11355411176883518}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7540895737147015, "res": {"Yes": 0.7540895737147015, "No": 0.24590745820108373}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6296787690699595, "res": {"Yes": 0.6296787690699595, "No": 0.37031874915711055}, "ground_truth": 1}, {"key": "41028780", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7834809041329902, "res": {"Yes": 0.7834809041329902, "No": 0.2165174574321221}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9967228565951706, "res": {"Yes": 0.9967228565951706, "No": 0.0032758365742359906}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3149318540215912, "res": {"No": 0.6850671954387102, "Yes": 0.3149318540215912}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993406789477088, "res": {"Yes": 0.9993406789477088, "No": 0.0006588091966887188}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.985990676802267, "res": {"Yes": 0.985990676802267, "No": 0.014001609383633347}, "ground_truth": 1}, {"key": "39457108", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.978867536998364, "res": {"Yes": 0.978867536998364, "No": 0.021120524207948323}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9153240119211696, "res": {"Yes": 0.9153240119211696, "No": 0.08466166306800767}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7835535753569244, "res": {"Yes": 0.7835535753569244, "No": 0.21644504445435683}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9986392637422874, "res": {"Yes": 0.9986392637422874, "No": 0.0013603231461433668}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9958777588580167, "res": {"Yes": 0.9958777588580167, "No": 0.0041219385682879466}, "ground_truth": 1}, {"key": "38288018", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9939696509849303, "res": {"Yes": 0.9939696509849303, "No": 0.006029184004721831}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9978414841530794, "res": {"Yes": 0.9978414841530794, "No": 0.0021579480190375435}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.06568666119864065, "res": {"No": 0.9343123171292784, "Yes": 0.06568666119864065}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998300858170501, "res": {"Yes": 0.9998300858170501, "No": 0.00016975760353173393}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9978668879240878, "res": {"Yes": 0.9978668879240878, "No": 0.002133032932692638}, "ground_truth": 1}, {"key": "40106293", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989846169505887, "res": {"Yes": 0.9989846169505887, "No": 0.0010151177128109512}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9920427875664297, "res": {"Yes": 0.9920427875664297, "No": 0.00795593888216647}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.07783547304320822, "res": {"No": 0.9221640802805856, "Yes": 0.07783547304320822}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9526061315395413, "res": {"Yes": 0.9526061315395413, "No": 0.047391660716993196}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9959197379820539, "res": {"Yes": 0.9959197379820539, "No": 0.004077121721243243}, "ground_truth": 1}, {"key": "39948797", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9914171517606265, "res": {"Yes": 0.9914171517606265, "No": 0.008579960235929985}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9180708800122211, "res": {"Yes": 0.9180708800122211, "No": 0.08191819103721484}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.036330557043042624, "res": {"No": 0.9636643400253443, "Yes": 0.036330557043042624}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.40658637009700993, "res": {"No": 0.5934081718420893, "Yes": 0.40658637009700993}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9984186620345593, "res": {"Yes": 0.9984186620345593, "No": 0.0015809015395793938}, "ground_truth": 1}, {"key": "31853399", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9332781390198922, "res": {"Yes": 0.9332781390198922, "No": 0.06671768625267895}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8896857486605815, "res": {"Yes": 0.8896857486605815, "No": 0.11031206226482039}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8682916747061732, "res": {"Yes": 0.8682916747061732, "No": 0.1317064758788821}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7388722660475673, "res": {"Yes": 0.7388722660475673, "No": 0.26112673886468907}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7553615576930336, "res": {"Yes": 0.7553615576930336, "No": 0.24463665745792576}, "ground_truth": 1}, {"key": "35273252", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9752009564913305, "res": {"Yes": 0.9752009564913305, "No": 0.024798138230004083}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.11650414817009785, "res": {"No": 0.8834951118045007, "Yes": 0.11650414817009785}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9977978117822981, "res": {"Yes": 0.9977978117822981, "No": 0.002201665411003592}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997570363904394, "res": {"Yes": 0.9997570363904394, "No": 0.00024105679218869438}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997552597537814, "res": {"Yes": 0.9997552597537814, "No": 0.00024404961821607277}, "ground_truth": 1}, {"key": "37130459", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999323394050813, "res": {"Yes": 0.9999323394050813, "No": 6.655891917097547e-05}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.996330190470856, "res": {"Yes": 0.996330190470856, "No": 0.0036694176792839116}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9566728150841525, "res": {"Yes": 0.9566728150841525, "No": 0.04332686922728085}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997750319291123, "res": {"Yes": 0.9997750319291123, "No": 0.0002248086414656647}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994187804335692, "res": {"Yes": 0.9994187804335692, "No": 0.000580575909300405}, "ground_truth": 1}, {"key": "21734003", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988952815511988, "res": {"Yes": 0.9988952815511988, "No": 0.0011046629645436812}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990076973582042, "res": {"Yes": 0.9990076973582042, "No": 0.0009920337788490595}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7627395163672288, "res": {"Yes": 0.7627395163672288, "No": 0.2372602355397873}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8609664600146305, "res": {"Yes": 0.8609664600146305, "No": 0.139031813213373}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999975250738268, "res": {"Yes": 0.999975250738268, "No": 2.442774454805121e-05}, "ground_truth": 1}, {"key": "33990737", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992439046142795, "res": {"Yes": 0.9992439046142795, "No": 0.0007556010747185407}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.951055118168557, "res": {"Yes": 0.951055118168557, "No": 0.04893798473964844}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.004352619635860368, "res": {"No": 0.9956454947710589, "Yes": 0.004352619635860368}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.1278886136206897, "res": {"No": 0.8721050954764605, "Yes": 0.1278886136206897}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.03457804624117485, "res": {"No": 0.9654214280204004, "Yes": 0.03457804624117485}, "ground_truth": 1}, {"key": "34559912", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.41239378387538905, "res": {"No": 0.5876050737612921, "Yes": 0.41239378387538905}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.004050221937428736, "res": {"No": 0.9959494163344838, "Yes": 0.004050221937428736}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.765378267533693, "res": {"Yes": 0.765378267533693, "No": 0.23462074958970594}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9978220175532359, "res": {"Yes": 0.9978220175532359, "No": 0.002177370767549969}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995291618091064, "res": {"Yes": 0.9995291618091064, "No": 0.00046934568161559716}, "ground_truth": 1}, {"key": "39820439", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9984782026097512, "res": {"Yes": 0.9984782026097512, "No": 0.0015183828878933409}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992026023905815, "res": {"Yes": 0.9992026023905815, "No": 0.0007965899527202095}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9961486918838784, "res": {"Yes": 0.9961486918838784, "No": 0.003850849136754324}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9952020630489737, "res": {"Yes": 0.9952020630489737, "No": 0.004796129694307281}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9982355802219867, "res": {"Yes": 0.9982355802219867, "No": 0.0017641540416707252}, "ground_truth": 1}, {"key": "34759328", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986909748218853, "res": {"Yes": 0.9986909748218853, "No": 0.0013084779336343094}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.026155125600784944, "res": {"No": 0.9738409260061948, "Yes": 0.026155125600784944}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9937003634406935, "res": {"Yes": 0.9937003634406935, "No": 0.006299109530120704}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9740488797992378, "res": {"Yes": 0.9740488797992378, "No": 0.02595009781534206}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9986556695228689, "res": {"Yes": 0.9986556695228689, "No": 0.0013441640275768077}, "ground_truth": 1}, {"key": "36939137", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9563429030922214, "res": {"Yes": 0.9563429030922214, "No": 0.0436556310689902}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9603275670922563, "res": {"Yes": 0.9603275670922563, "No": 0.03967148941652497}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.02464294318517038, "res": {"No": 0.9753544749562456, "Yes": 0.02464294318517038}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9698409752170981, "res": {"Yes": 0.9698409752170981, "No": 0.03014125643571093}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997638293726743, "res": {"Yes": 0.9997638293726743, "No": 0.0002358006059740031}, "ground_truth": 1}, {"key": "35851522", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9867698352944697, "res": {"Yes": 0.9867698352944697, "No": 0.013229584595836955}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9979749144582097, "res": {"Yes": 0.9979749144582097, "No": 0.0020242459867219824}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8374663710996257, "res": {"Yes": 0.8374663710996257, "No": 0.16253245078673953}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996039599145867, "res": {"Yes": 0.9996039599145867, "No": 0.0003958104986534178}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9885283776440155, "res": {"Yes": 0.9885283776440155, "No": 0.01147026780286093}, "ground_truth": 1}, {"key": "22412782", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986934711529659, "res": {"Yes": 0.9986934711529659, "No": 0.0013060425085468172}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9711262854902319, "res": {"Yes": 0.9711262854902319, "No": 0.028872473840805945}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0007929238251681107, "res": {"No": 0.9992055801186938, "Yes": 0.0007929238251681107}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9675061891929551, "res": {"Yes": 0.9675061891929551, "No": 0.03249081321217068}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.955786004168308, "res": {"Yes": 0.955786004168308, "No": 0.044210392195015186}, "ground_truth": 1}, {"key": "38579227", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9278841614602623, "res": {"Yes": 0.9278841614602623, "No": 0.07210724170489106}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.635193088457661, "res": {"Yes": 0.635193088457661, "No": 0.3647885530408585}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9794998389678052, "res": {"Yes": 0.9794998389678052, "No": 0.02049918191949812}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9937796012856251, "res": {"Yes": 0.9937796012856251, "No": 0.006218410198484489}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9800694053887612, "res": {"Yes": 0.9800694053887612, "No": 0.01992779874858777}, "ground_truth": 1}, {"key": "37206995", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9982907031147399, "res": {"Yes": 0.9982907031147399, "No": 0.001708132688769521}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.640815932554561, "res": {"Yes": 0.640815932554561, "No": 0.3591814092065402}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.13571269019091045, "res": {"No": 0.8642831361361321, "Yes": 0.13571269019091045}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.2849714725611841, "res": {"No": 0.7150257664102726, "Yes": 0.2849714725611841}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.2912709340845738, "res": {"No": 0.7087248993120855, "Yes": 0.2912709340845738}, "ground_truth": 1}, {"key": "38700847", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.33795105556676824, "res": {"No": 0.6620471513349862, "Yes": 0.33795105556676824}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7555215148833296, "res": {"Yes": 0.7555215148833296, "No": 0.2444711189373255}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999511724841019, "res": {"Yes": 0.9999511724841019, "No": 4.86404047013851e-05}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9987738555301703, "res": {"Yes": 0.9987738555301703, "No": 0.0012255666138581104}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998117354140017, "res": {"Yes": 0.9998117354140017, "No": 0.0001881084311426835}, "ground_truth": 1}, {"key": "20246590", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997639485445299, "res": {"Yes": 0.9997639485445299, "No": 0.00023584376143350082}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9884516075572687, "res": {"Yes": 0.9884516075572687, "No": 0.011547915898317619}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.09308068326071989, "res": {"No": 0.9069139106182849, "Yes": 0.09308068326071989}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9646513917335421, "res": {"Yes": 0.9646513917335421, "No": 0.03534768417856773}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998959159250891, "res": {"Yes": 0.998959159250891, "No": 0.0010396673216824283}, "ground_truth": 1}, {"key": "39141360", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.970132824873382, "res": {"Yes": 0.970132824873382, "No": 0.029865981164925243}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996689994827624, "res": {"Yes": 0.9996689994827624, "No": 0.00032988547803247366}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9658301465100226, "res": {"Yes": 0.9658301465100226, "No": 0.03416828173145696}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.995931202677698, "res": {"Yes": 0.995931202677698, "No": 0.004068187949179077}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9900210108479207, "res": {"Yes": 0.9900210108479207, "No": 0.009975449046764059}, "ground_truth": 1}, {"key": "37906226", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8981119432873423, "res": {"Yes": 0.8981119432873423, "No": 0.10188474047164889}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9836586996946848, "res": {"Yes": 0.9836586996946848, "No": 0.016339550485434777}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0010840752061544352, "res": {"No": 0.9989158556096318, "Yes": 0.0010840752061544352}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9974613342759852, "res": {"Yes": 0.9974613342759852, "No": 0.002538072612431775}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999473581626301, "res": {"Yes": 0.9999473581626301, "No": 5.2529271046164054e-05}, "ground_truth": 1}, {"key": "16201033", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9956118198221121, "res": {"Yes": 0.9956118198221121, "No": 0.004386994107377048}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992915108370537, "res": {"Yes": 0.9992915108370537, "No": 0.0007082541923238043}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0006388448080404745, "res": {"No": 0.9993607966775409, "Yes": 0.0006388448080404745}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.22734256548353235, "res": {"No": 0.7726570421978672, "Yes": 0.22734256548353235}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.47023851701187225, "res": {"No": 0.5297531688858956, "Yes": 0.47023851701187225}, "ground_truth": 1}, {"key": "36469022", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.02220131849945917, "res": {"No": 0.9777953377019126, "Yes": 0.02220131849945917}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.06153993286532698, "res": {"No": 0.9384510575210175, "Yes": 0.06153993286532698}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.04325427095824947, "res": {"No": 0.9567435253849823, "Yes": 0.04325427095824947}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.4166641405717824, "res": {"No": 0.5833338587609707, "Yes": 0.4166641405717824}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4887210021901141, "res": {"No": 0.5112714073165219, "Yes": 0.4887210021901141}, "ground_truth": 1}, {"key": "31295270", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9841509846653417, "res": {"Yes": 0.9841509846653417, "No": 0.01584844326819613}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9555394231206387, "res": {"Yes": 0.9555394231206387, "No": 0.04445957187209435}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.014726561660875243, "res": {"No": 0.985273257009134, "Yes": 0.014726561660875243}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9468755532444558, "res": {"Yes": 0.9468755532444558, "No": 0.053123387773021946}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999171537514701, "res": {"Yes": 0.999171537514701, "No": 0.0008280125058578654}, "ground_truth": 1}, {"key": "35360689", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9977419126237757, "res": {"Yes": 0.9977419126237757, "No": 0.0022574493708773396}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9577811469208729, "res": {"Yes": 0.9577811469208729, "No": 0.04221686893575274}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.6078755229296705, "res": {"Yes": 0.6078755229296705, "No": 0.3921222600248793}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9970892906525046, "res": {"Yes": 0.9970892906525046, "No": 0.0029105057955461245}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9966640054361825, "res": {"Yes": 0.9966640054361825, "No": 0.003335474602981633}, "ground_truth": 1}, {"key": "29202793", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9365134455187903, "res": {"Yes": 0.9365134455187903, "No": 0.06348353487581891}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9947757877111069, "res": {"Yes": 0.9947757877111069, "No": 0.005224067322163619}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.00034100220991929904, "res": {"No": 0.9996586359179813, "Yes": 0.00034100220991929904}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9985840996341157, "res": {"Yes": 0.9985840996341157, "No": 0.001414478170504887}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994799881030773, "res": {"Yes": 0.9994799881030773, "No": 0.0005188252690401718}, "ground_truth": 1}, {"key": "35999008", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9960575054187617, "res": {"Yes": 0.9960575054187617, "No": 0.0039415982134091915}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9983990613716279, "res": {"Yes": 0.9983990613716279, "No": 0.0016003658814059923}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3174645247382098, "res": {"No": 0.6825336630426189, "Yes": 0.3174645247382098}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9767384344175892, "res": {"Yes": 0.9767384344175892, "No": 0.02326017054042424}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9947571465833263, "res": {"Yes": 0.9947571465833263, "No": 0.005242436016664584}, "ground_truth": 1}, {"key": "31797119", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998925288654362, "res": {"Yes": 0.9998925288654362, "No": 0.00010684333022505419}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6922547744169947, "res": {"Yes": 0.6922547744169947, "No": 0.30774098734010685}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9921347770145241, "res": {"Yes": 0.9921347770145241, "No": 0.0078647573092859}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9792333082739056, "res": {"Yes": 0.9792333082739056, "No": 0.020765963557796745}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7210787387227954, "res": {"Yes": 0.7210787387227954, "No": 0.27891840364202014}, "ground_truth": 1}, {"key": "26711893", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999302224358729, "res": {"Yes": 0.999302224358729, "No": 0.0006974567872161093}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8878824241436077, "res": {"Yes": 0.8878824241436077, "No": 0.11211383947635747}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9988241558471254, "res": {"Yes": 0.9988241558471254, "No": 0.0011752229555287287}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9969076481997613, "res": {"Yes": 0.9969076481997613, "No": 0.0030919036803107964}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9919457774696367, "res": {"Yes": 0.9919457774696367, "No": 0.008053234234323246}, "ground_truth": 1}, {"key": "35348288", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989890193855977, "res": {"Yes": 0.9989890193855977, "No": 0.0010104780937298177}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9959400738748023, "res": {"Yes": 0.9959400738748023, "No": 0.004059185261555644}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.943049936329941, "res": {"Yes": 0.943049936329941, "No": 0.0569476018341103}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6633492733795517, "res": {"Yes": 0.6633492733795517, "No": 0.3366477323301562}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9910320441583453, "res": {"Yes": 0.9910320441583453, "No": 0.00896733633168599}, "ground_truth": 1}, {"key": "38124131", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9626558729595737, "res": {"Yes": 0.9626558729595737, "No": 0.0373435975413244}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8231770696407332, "res": {"Yes": 0.8231770696407332, "No": 0.17681575867032048}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0017348614928159442, "res": {"No": 0.998264920893174, "Yes": 0.0017348614928159442}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5180449471122633, "res": {"Yes": 0.5180449471122633, "No": 0.4819527012178733}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8936710183104966, "res": {"Yes": 0.8936710183104966, "No": 0.10632740699584194}, "ground_truth": 1}, {"key": "20285901", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8621063759136681, "res": {"Yes": 0.8621063759136681, "No": 0.13789138071719972}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.001194559238155334, "res": {"No": 0.9988051279287906, "Yes": 0.001194559238155334}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9524582709187737, "res": {"Yes": 0.9524582709187737, "No": 0.04754073768628458}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9892997958608946, "res": {"Yes": 0.9892997958608946, "No": 0.010699727554871336}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998786930064902, "res": {"Yes": 0.998786930064902, "No": 0.0012128115738980008}, "ground_truth": 1}, {"key": "35633632", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9613698139774169, "res": {"Yes": 0.9613698139774169, "No": 0.0386296060650101}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9931901101093984, "res": {"Yes": 0.9931901101093984, "No": 0.00680943791776686}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9992372416481606, "res": {"Yes": 0.9992372416481606, "No": 0.0007626037447876164}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9983321581965542, "res": {"Yes": 0.9983321581965542, "No": 0.0016676146948852932}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995569162406144, "res": {"Yes": 0.9995569162406144, "No": 0.00044296668230114076}, "ground_truth": 1}, {"key": "10741274", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998984884226488, "res": {"Yes": 0.9998984884226488, "No": 0.00010131551494968752}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993307952874216, "res": {"Yes": 0.9993307952874216, "No": 0.0006690215406990944}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.701010916020222, "res": {"Yes": 0.701010916020222, "No": 0.29898705525206337}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6967469152298691, "res": {"Yes": 0.6967469152298691, "No": 0.3032515560276488}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7268226710335967, "res": {"Yes": 0.7268226710335967, "No": 0.2731752358936333}, "ground_truth": 1}, {"key": "30605795", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9900136520490961, "res": {"Yes": 0.9900136520490961, "No": 0.009975567755314026}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8009310063644686, "res": {"Yes": 0.8009310063644686, "No": 0.1990635218333639}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9902677300701533, "res": {"Yes": 0.9902677300701533, "No": 0.009732011231326776}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9981972119780178, "res": {"Yes": 0.9981972119780178, "No": 0.0018017850698910846}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.986065422658541, "res": {"Yes": 0.986065422658541, "No": 0.013933776812189715}, "ground_truth": 1}, {"key": "30539722", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9715252215988396, "res": {"Yes": 0.9715252215988396, "No": 0.028474520759785082}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.997904990901428, "res": {"Yes": 0.997904990901428, "No": 0.002094507158127645}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.17075137975628338, "res": {"No": 0.8292386486029572, "Yes": 0.17075137975628338}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993554432160282, "res": {"Yes": 0.9993554432160282, "No": 0.0006437365496192157}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992508095833891, "res": {"Yes": 0.9992508095833891, "No": 0.0007489143001640629}, "ground_truth": 1}, {"key": "18639299", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994706987293668, "res": {"Yes": 0.9994706987293668, "No": 0.0005291966796632784}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9989194242429005, "res": {"Yes": 0.9989194242429005, "No": 0.0010803189039476305}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9976625278526384, "res": {"Yes": 0.9976625278526384, "No": 0.002334482592990035}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999375840279578, "res": {"Yes": 0.9999375840279578, "No": 6.1845637200809e-05}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9974436584202979, "res": {"Yes": 0.9974436584202979, "No": 0.002555748866083367}, "ground_truth": 1}, {"key": "39773552", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999309090568892, "res": {"Yes": 0.9999309090568892, "No": 6.892862562303037e-05}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993769908008738, "res": {"Yes": 0.9993769908008738, "No": 0.0006218153961697825}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.1421052924537727, "res": {"No": 0.857894257582539, "Yes": 0.1421052924537727}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9967679902246802, "res": {"Yes": 0.9967679902246802, "No": 0.0032316491477057683}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990075782764937, "res": {"Yes": 0.9990075782764937, "No": 0.0009913528822350583}, "ground_truth": 1}, {"key": "34086410", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9971202285198512, "res": {"Yes": 0.9971202285198512, "No": 0.002879156239946016}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988650707199379, "res": {"Yes": 0.9988650707199379, "No": 0.0011343029019960128}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9981946016957214, "res": {"Yes": 0.9981946016957214, "No": 0.0018046139286853836}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998864501472726, "res": {"Yes": 0.9998864501472726, "No": 0.0001133665708287076}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990995475508377, "res": {"Yes": 0.9990995475508377, "No": 0.0009001411262395965}, "ground_truth": 1}, {"key": "35454652", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9985925438966821, "res": {"Yes": 0.9985925438966821, "No": 0.0014073637577096017}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998175716220805, "res": {"Yes": 0.9998175716220805, "No": 0.0001822489405975902}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0002799991473439052, "res": {"No": 0.9997191578835323, "Yes": 0.0002799991473439052}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9981730942276238, "res": {"Yes": 0.9981730942276238, "No": 0.001825853920017403}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996151606896513, "res": {"Yes": 0.9996151606896513, "No": 0.0003843166637604838}, "ground_truth": 1}, {"key": "36158310", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995682319786514, "res": {"Yes": 0.9995682319786514, "No": 0.000431264917031052}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998160259453023, "res": {"Yes": 0.9998160259453023, "No": 0.00018325462110970963}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 3.255173135807507e-05, "res": {"No": 0.9999655955278475, "Yes": 3.255173135807507e-05}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.1854779076970337, "res": {"No": 0.8145112735236782, "Yes": 0.1854779076970337}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9604501616910183, "res": {"Yes": 0.9604501616910183, "No": 0.03954916094649354}, "ground_truth": 1}, {"key": "35688387", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9862568316019105, "res": {"Yes": 0.9862568316019105, "No": 0.013742679453890008}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8866000981210771, "res": {"Yes": 0.8866000981210771, "No": 0.11339651727735574}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.625439510241577, "res": {"Yes": 0.625439510241577, "No": 0.374559889594537}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998420042226477, "res": {"Yes": 0.9998420042226477, "No": 0.00015787641729659183}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998480789911653, "res": {"Yes": 0.9998480789911653, "No": 0.00015180435566030477}, "ground_truth": 1}, {"key": "34209292", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996009883763198, "res": {"Yes": 0.9996009883763198, "No": 0.00039884527429650206}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997724100525223, "res": {"Yes": 0.9997724100525223, "No": 0.000226985595146679}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9006932899833249, "res": {"Yes": 0.9006932899833249, "No": 0.09930589938278261}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9965965073564745, "res": {"Yes": 0.9965965073564745, "No": 0.003403379739711786}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998992035803005, "res": {"Yes": 0.9998992035803005, "No": 0.00010061642935146516}, "ground_truth": 1}, {"key": "25037859", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999385375988907, "res": {"Yes": 0.9999385375988907, "No": 6.128600772802877e-05}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998269870484672, "res": {"Yes": 0.9998269870484672, "No": 0.0001728110079861078}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.19494907663194755, "res": {"No": 0.805047851880858, "Yes": 0.19494907663194755}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9978235598879204, "res": {"Yes": 0.9978235598879204, "No": 0.002173822805097152}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9986963283192045, "res": {"Yes": 0.9986963283192045, "No": 0.001301167943205527}, "ground_truth": 1}, {"key": "36412121", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9968888121067725, "res": {"Yes": 0.9968888121067725, "No": 0.0031098359605063438}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985395211387905, "res": {"Yes": 0.9985395211387905, "No": 0.001458027768451318}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8885924988972808, "res": {"Yes": 0.8885924988972808, "No": 0.11140679020280378}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9951528322177559, "res": {"Yes": 0.9951528322177559, "No": 0.004847059725678272}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9871315428484589, "res": {"Yes": 0.9871315428484589, "No": 0.012865087910041399}, "ground_truth": 1}, {"key": "34909172", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996852022792035, "res": {"Yes": 0.9996852022792035, "No": 0.00031412926022371374}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9964419174310178, "res": {"Yes": 0.9964419174310178, "No": 0.0035573681188055123}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.011331445844911173, "res": {"No": 0.9886678283035916, "Yes": 0.011331445844911173}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.12437040859548273, "res": {"No": 0.8756265865383766, "Yes": 0.12437040859548273}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.03219074146242228, "res": {"No": 0.9678077923920315, "Yes": 0.03219074146242228}, "ground_truth": 1}, {"key": "39011806", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.06584966092558195, "res": {"No": 0.934147304118257, "Yes": 0.06584966092558195}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0949933490340801, "res": {"No": 0.9049994346305775, "Yes": 0.0949933490340801}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.981100115586137, "res": {"Yes": 0.981100115586137, "No": 0.018899855546274647}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989245407212948, "res": {"Yes": 0.9989245407212948, "No": 0.0010752257924170378}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994658176262344, "res": {"Yes": 0.9994658176262344, "No": 0.0005340244145062775}, "ground_truth": 1}, {"key": "33096163", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997403667405498, "res": {"Yes": 0.9997403667405498, "No": 0.0002595954760250941}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992092651557002, "res": {"Yes": 0.9992092651557002, "No": 0.0007906011124553778}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9995609637046521, "res": {"Yes": 0.9995609637046521, "No": 0.00043851128983300226}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997824209237612, "res": {"Yes": 0.9997824209237612, "No": 0.00021641082264928075}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997758661717403, "res": {"Yes": 0.9997758661717403, "No": 0.00022303652738169108}, "ground_truth": 1}, {"key": "38762205", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995601296513408, "res": {"Yes": 0.9995601296513408, "No": 0.0004387050230525531}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997965995086854, "res": {"Yes": 0.9997965995086854, "No": 0.00020230036693016614}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.004486405296485716, "res": {"No": 0.9955130388237245, "Yes": 0.004486405296485716}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6016614303142177, "res": {"Yes": 0.6016614303142177, "No": 0.3983343703097297}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9938742626051426, "res": {"Yes": 0.9938742626051426, "No": 0.006123659522332516}, "ground_truth": 1}, {"key": "35519177", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8869771446750202, "res": {"Yes": 0.8869771446750202, "No": 0.11302187442742873}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9584293961323318, "res": {"Yes": 0.9584293961323318, "No": 0.04156700813675016}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9890228930034265, "res": {"Yes": 0.9890228930034265, "No": 0.010974568910696047}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9981757118401783, "res": {"Yes": 0.9981757118401783, "No": 0.0018238474968656011}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980723932248455, "res": {"Yes": 0.9980723932248455, "No": 0.0019276082370342498}, "ground_truth": 1}, {"key": "36192531", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994652219447846, "res": {"Yes": 0.9994652219447846, "No": 0.0005344745731031242}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999768477225535, "res": {"Yes": 0.999768477225535, "No": 0.00023133978441366483}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9994411669653781, "res": {"Yes": 0.9994411669653781, "No": 0.0005585258811852833}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998617854325136, "res": {"Yes": 0.9998617854325136, "No": 0.00013809164486427625}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999661915245194, "res": {"Yes": 0.9999661915245194, "No": 3.365201912361953e-05}, "ground_truth": 1}, {"key": "33160852", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999963211539712, "res": {"Yes": 0.999963211539712, "No": 3.664853878012855e-05}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9958483271216463, "res": {"Yes": 0.9958483271216463, "No": 0.004150960606828461}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9367831627625869, "res": {"Yes": 0.9367831627625869, "No": 0.0632163821616682}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9726154858725933, "res": {"Yes": 0.9726154858725933, "No": 0.027384095234988064}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991629656088916, "res": {"Yes": 0.9991629656088916, "No": 0.0008367021542230719}, "ground_truth": 1}, {"key": "36312304", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9979625680879273, "res": {"Yes": 0.9979625680879273, "No": 0.002037336421497073}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990523077442216, "res": {"Yes": 0.9990523077442216, "No": 0.0009470089631873691}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9963743232962562, "res": {"Yes": 0.9963743232962562, "No": 0.0036254868363867474}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989701037076004, "res": {"Yes": 0.9989701037076004, "No": 0.0010297636181714118}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9978897976142315, "res": {"Yes": 0.9978897976142315, "No": 0.0021098074322405008}, "ground_truth": 1}, {"key": "33773343", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978026772558504, "res": {"Yes": 0.9978026772558504, "No": 0.0021970362191170677}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999008722634788, "res": {"Yes": 0.9999008722634788, "No": 9.901591135364396e-05}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.017737977792532368, "res": {"No": 0.9822606462171142, "Yes": 0.017737977792532368}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7857239947018266, "res": {"Yes": 0.7857239947018266, "No": 0.21427140925188962}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9566007095448639, "res": {"Yes": 0.9566007095448639, "No": 0.04339836983442519}, "ground_truth": 1}, {"key": "34913320", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9725879699971101, "res": {"Yes": 0.9725879699971101, "No": 0.027409341309089248}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.23104492658259945, "res": {"No": 0.7689425420640934, "Yes": 0.23104492658259945}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9975690314016018, "res": {"Yes": 0.9975690314016018, "No": 0.0024306513798481675}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9530231213259979, "res": {"Yes": 0.9530231213259979, "No": 0.046972239533352535}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996377862852326, "res": {"Yes": 0.9996377862852326, "No": 0.00036163975267271953}, "ground_truth": 1}, {"key": "33784155", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999111228098115, "res": {"Yes": 0.9999111228098115, "No": 8.84097765481239e-05}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999552745967917, "res": {"Yes": 0.999552745967917, "No": 0.0004462892381984088}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9959579275553734, "res": {"Yes": 0.9959579275553734, "No": 0.004039085395059803}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9795397602767532, "res": {"Yes": 0.9795397602767532, "No": 0.02045899786220744}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.960187406949442, "res": {"Yes": 0.960187406949442, "No": 0.03979664765552296}, "ground_truth": 1}, {"key": "24085062", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8741571622361728, "res": {"Yes": 0.8741571622361728, "No": 0.12582144251446978}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9804059386225333, "res": {"Yes": 0.9804059386225333, "No": 0.01959326684659413}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.004311756143354576, "res": {"No": 0.9956881548131273, "Yes": 0.004311756143354576}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9972942518529395, "res": {"Yes": 0.9972942518529395, "No": 0.0027057054658563844}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987008484290155, "res": {"Yes": 0.9987008484290155, "No": 0.0012984270612282395}, "ground_truth": 1}, {"key": "33893487", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9533820697763654, "res": {"Yes": 0.9533820697763654, "No": 0.04661768049706387}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0575178353082825, "res": {"No": 0.942481397740603, "Yes": 0.0575178353082825}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.06916128764441973, "res": {"No": 0.930834130785006, "Yes": 0.06916128764441973}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.0005414726503505287, "res": {"No": 0.9994579580578408, "Yes": 0.0005414726503505287}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9288640695319331, "res": {"Yes": 0.9288640695319331, "No": 0.07113427434695939}, "ground_truth": 1}, {"key": "40913011", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3961798516494768, "res": {"No": 0.6038072406375486, "Yes": 0.3961798516494768}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.10079110210590671, "res": {"No": 0.8992019277454316, "Yes": 0.10079110210590671}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9720970245572398, "res": {"Yes": 0.9720970245572398, "No": 0.027902717317637236}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9929749548072527, "res": {"Yes": 0.9929749548072527, "No": 0.0070247918085153726}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9451503401840851, "res": {"Yes": 0.9451503401840851, "No": 0.054848803858552876}, "ground_truth": 1}, {"key": "29642545", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9853217533523293, "res": {"Yes": 0.9853217533523293, "No": 0.014677034290694143}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9929833003996286, "res": {"Yes": 0.9929833003996286, "No": 0.007016228893102055}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996597084123208, "res": {"Yes": 0.9996597084123208, "No": 0.0003399880799293407}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989755740828662, "res": {"Yes": 0.9989755740828662, "No": 0.0010242337570983671}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990678940808556, "res": {"Yes": 0.9990678940808556, "No": 0.0009316442706410894}, "ground_truth": 1}, {"key": "35969159", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993642513738502, "res": {"Yes": 0.9993642513738502, "No": 0.000635580120841448}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9979432140889439, "res": {"Yes": 0.9979432140889439, "No": 0.0020566846208958027}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0022371355584198003, "res": {"No": 0.9977586458937087, "Yes": 0.0022371355584198003}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9958933669740897, "res": {"Yes": 0.9958933669740897, "No": 0.004102691734817944}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997081979225102, "res": {"Yes": 0.9997081979225102, "No": 0.00029149229056059085}, "ground_truth": 1}, {"key": "37081669", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9980617040265616, "res": {"Yes": 0.9980617040265616, "No": 0.0019375468817446869}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988481815526753, "res": {"Yes": 0.9988481815526753, "No": 0.0011513420695983365}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4384175553553937, "res": {"No": 0.5615773265712414, "Yes": 0.4384175553553937}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9976490033317836, "res": {"Yes": 0.9976490033317836, "No": 0.00234949586352423}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9951458621917281, "res": {"Yes": 0.9951458621917281, "No": 0.004852132402698903}, "ground_truth": 1}, {"key": "40048022", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7953708779234162, "res": {"Yes": 0.7953708779234162, "No": 0.2046175197201158}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7777414783988996, "res": {"Yes": 0.7777414783988996, "No": 0.22225617965562136}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9928198229308957, "res": {"Yes": 0.9928198229308957, "No": 0.007180117723685085}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998023201312406, "res": {"Yes": 0.9998023201312406, "No": 0.0001960362435024021}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9918473684350251, "res": {"Yes": 0.9918473684350251, "No": 0.008152048774064998}, "ground_truth": 1}, {"key": "32884004", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9673093865251262, "res": {"Yes": 0.9673093865251262, "No": 0.032688684523531034}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9902221401835931, "res": {"Yes": 0.9902221401835931, "No": 0.00977695688800881}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9922272582071087, "res": {"Yes": 0.9922272582071087, "No": 0.007772225760191952}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989102626954137, "res": {"Yes": 0.9989102626954137, "No": 0.0010895418415034005}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.979697633666378, "res": {"Yes": 0.979697633666378, "No": 0.02030166249464058}, "ground_truth": 1}, {"key": "39022490", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.1285799743185387, "res": {"No": 0.8714176680744824, "Yes": 0.1285799743185387}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7247964660674561, "res": {"Yes": 0.7247964660674561, "No": 0.2752014235920775}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3475873425818545, "res": {"No": 0.6524103264224198, "Yes": 0.3475873425818545}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6029595293579001, "res": {"Yes": 0.6029595293579001, "No": 0.3970387484139526}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.25008655526014123, "res": {"No": 0.7499116570422297, "Yes": 0.25008655526014123}, "ground_truth": 1}, {"key": "35159385", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.982800139886959, "res": {"Yes": 0.982800139886959, "No": 0.017199121019259217}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.3872106572767282, "res": {"No": 0.6127850849700794, "Yes": 0.3872106572767282}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.2717251504087652, "res": {"No": 0.7282735397090301, "Yes": 0.2717251504087652}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9948655681881075, "res": {"Yes": 0.9948655681881075, "No": 0.005130413596243024}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9581755264789772, "res": {"Yes": 0.9581755264789772, "No": 0.04181870715391686}, "ground_truth": 1}, {"key": "34363669", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9946139610012937, "res": {"Yes": 0.9946139610012937, "No": 0.005384582508377446}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9913682974142578, "res": {"Yes": 0.9913682974142578, "No": 0.008630248322215671}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.009305574032807665, "res": {"No": 0.9906912075796396, "Yes": 0.009305574032807665}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9682608740771905, "res": {"Yes": 0.9682608740771905, "No": 0.03173687579144416}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9539806535854616, "res": {"Yes": 0.9539806535854616, "No": 0.046015287534429294}, "ground_truth": 1}, {"key": "36119687", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.38660831670903173, "res": {"No": 0.6133905827273286, "Yes": 0.38660831670903173}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9983219458099758, "res": {"Yes": 0.9983219458099758, "No": 0.001676777470394162}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.14562355171738064, "res": {"No": 0.8543676878662048, "Yes": 0.14562355171738064}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996458892320231, "res": {"Yes": 0.9996458892320231, "No": 0.0003526688652730396}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9976288306738269, "res": {"Yes": 0.9976288306738269, "No": 0.0023697448212277633}, "ground_truth": 1}, {"key": "35217446", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9974397530370432, "res": {"Yes": 0.9974397530370432, "No": 0.0025590274372447657}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992327153135552, "res": {"Yes": 0.9992327153135552, "No": 0.0007666749809933591}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9961434815417719, "res": {"Yes": 0.9961434815417719, "No": 0.003856458514272325}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9496392075966601, "res": {"Yes": 0.9496392075966601, "No": 0.05036033589254986}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9976932566310205, "res": {"Yes": 0.9976932566310205, "No": 0.002306291397963651}, "ground_truth": 1}, {"key": "39049331", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9878295760396941, "res": {"Yes": 0.9878295760396941, "No": 0.012170166389166903}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.22673553154114875, "res": {"No": 0.7732617824224294, "Yes": 0.22673553154114875}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9993555623791783, "res": {"Yes": 0.9993555623791783, "No": 0.0006443533514211851}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6884710841672698, "res": {"Yes": 0.6884710841672698, "No": 0.3115185163453743}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7116841325954432, "res": {"Yes": 0.7116841325954432, "No": 0.28831195729954096}, "ground_truth": 1}, {"key": "36472242", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9932887760324933, "res": {"Yes": 0.9932887760324933, "No": 0.006710800738644566}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9873198758964647, "res": {"Yes": 0.9873198758964647, "No": 0.012678875713904345}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7011715921131257, "res": {"Yes": 0.7011715921131257, "No": 0.29882749855144186}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.996442378185867, "res": {"Yes": 0.996442378185867, "No": 0.0035571119975214374}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9979689809161976, "res": {"Yes": 0.9979689809161976, "No": 0.0020299942874427725}, "ground_truth": 1}, {"key": "31854721", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9935764314942747, "res": {"Yes": 0.9935764314942747, "No": 0.00642308337561887}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9908670986206692, "res": {"Yes": 0.9908670986206692, "No": 0.009132431500066998}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0038402047250059457, "res": {"No": 0.9961542583783215, "Yes": 0.0038402047250059457}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9654758696696943, "res": {"Yes": 0.9654758696696943, "No": 0.034523456065708995}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9972616440553338, "res": {"Yes": 0.9972616440553338, "No": 0.0027381466296194073}, "ground_truth": 1}, {"key": "18725849", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.995572823964257, "res": {"Yes": 0.995572823964257, "No": 0.004427034642438196}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9977165121341695, "res": {"Yes": 0.9977165121341695, "No": 0.002283234958894685}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9943677847318815, "res": {"Yes": 0.9943677847318815, "No": 0.005631986821847276}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9978258162688874, "res": {"Yes": 0.9978258162688874, "No": 0.002174101072224921}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9904524599574205, "res": {"Yes": 0.9904524599574205, "No": 0.009547413489201738}, "ground_truth": 1}, {"key": "36883179", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9944228270974775, "res": {"Yes": 0.9944228270974775, "No": 0.005577115342334942}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997552597537814, "res": {"Yes": 0.9997552597537814, "No": 0.00024443527696068636}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.998833316405113, "res": {"Yes": 0.998833316405113, "No": 0.0011662346123689372}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9974558793743562, "res": {"Yes": 0.9974558793743562, "No": 0.0025431278971508073}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9959697559207469, "res": {"Yes": 0.9959697559207469, "No": 0.004029792069549225}, "ground_truth": 1}, {"key": "34266359", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9321484647881215, "res": {"Yes": 0.9321484647881215, "No": 0.0678455486908012}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8864925440946249, "res": {"Yes": 0.8864925440946249, "No": 0.11350481727611399}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9950936974158108, "res": {"Yes": 0.9950936974158108, "No": 0.004905962386557677}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9915469992274939, "res": {"Yes": 0.9915469992274939, "No": 0.008452588949356351}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998697710105311, "res": {"Yes": 0.9998697710105311, "No": 0.00012990579812337147}, "ground_truth": 1}, {"key": "31920289", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999360915801355, "res": {"Yes": 0.999360915801355, "No": 0.0006388377807862362}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.991206520796382, "res": {"Yes": 0.991206520796382, "No": 0.008793225355038046}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.10256679849797022, "res": {"No": 0.897427358051093, "Yes": 0.10256679849797022}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9735073997670042, "res": {"Yes": 0.9735073997670042, "No": 0.026489617902999977}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9952128109907312, "res": {"Yes": 0.9952128109907312, "No": 0.004785398387342951}, "ground_truth": 1}, {"key": "36292997", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9975181541845214, "res": {"Yes": 0.9975181541845214, "No": 0.0024813028847568484}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.25561593881290934, "res": {"No": 0.7443819516557314, "Yes": 0.25561593881290934}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9848366117155289, "res": {"Yes": 0.9848366117155289, "No": 0.015162933725148488}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9955408058615354, "res": {"Yes": 0.9955408058615354, "No": 0.004458889210105164}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996910414375295, "res": {"Yes": 0.9996910414375295, "No": 0.0003086254969789075}, "ground_truth": 1}, {"key": "30412533", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993917483001111, "res": {"Yes": 0.9993917483001111, "No": 0.0006081782163210367}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9991840362396287, "res": {"Yes": 0.9991840362396287, "No": 0.0008158418769705153}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7136535203773063, "res": {"Yes": 0.7136535203773063, "No": 0.2863427382968175}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9945450883583963, "res": {"Yes": 0.9945450883583963, "No": 0.005453749092094976}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9019242342076499, "res": {"Yes": 0.9019242342076499, "No": 0.098075224286652}, "ground_truth": 1}, {"key": "40433191", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9934692324672059, "res": {"Yes": 0.9934692324672059, "No": 0.0065307009396977506}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9962701934725737, "res": {"Yes": 0.9962701934725737, "No": 0.0037285420240873376}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9547236166851409, "res": {"Yes": 0.9547236166851409, "No": 0.04527513017544032}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9975129331881658, "res": {"Yes": 0.9975129331881658, "No": 0.0024867864110903457}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.989568094725592, "res": {"Yes": 0.989568094725592, "No": 0.010430683291362382}, "ground_truth": 1}, {"key": "34565591", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9983490351443405, "res": {"Yes": 0.9983490351443405, "No": 0.0016499636856645396}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.22809462823795196, "res": {"No": 0.7719021389581868, "Yes": 0.22809462823795196}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.046303487349632876, "res": {"No": 0.9536957373494029, "Yes": 0.046303487349632876}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9957984383618281, "res": {"Yes": 0.9957984383618281, "No": 0.004199632321604499}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9223601808766717, "res": {"Yes": 0.9223601808766717, "No": 0.07763760256671401}, "ground_truth": 1}, {"key": "36062480", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9523048498687785, "res": {"Yes": 0.9523048498687785, "No": 0.04769290663536185}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.19129720752550497, "res": {"No": 0.8087008482299924, "Yes": 0.19129720752550497}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.1489239062194971, "res": {"No": 0.8510750788795532, "Yes": 0.1489239062194971}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9785534051947054, "res": {"Yes": 0.9785534051947054, "No": 0.02144476541471314}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988496065105075, "res": {"Yes": 0.9988496065105075, "No": 0.0011500354626447957}, "ground_truth": 1}, {"key": "37276883", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9960467410834658, "res": {"Yes": 0.9960467410834658, "No": 0.003952665964535066}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9989063406817488, "res": {"Yes": 0.9989063406817488, "No": 0.0010930470762917704}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.08734674560944669, "res": {"No": 0.9126528506423992, "Yes": 0.08734674560944669}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6381785665009903, "res": {"Yes": 0.6381785665009903, "No": 0.36181747754050875}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9567875930498665, "res": {"Yes": 0.9567875930498665, "No": 0.043210411751706534}, "ground_truth": 1}, {"key": "38509260", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6358033700702869, "res": {"Yes": 0.6358033700702869, "No": 0.3641861285011715}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7821170964037099, "res": {"Yes": 0.7821170964037099, "No": 0.2178482193925877}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.13449586821542736, "res": {"No": 0.8654971216684493, "Yes": 0.13449586821542736}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8781456857601014, "res": {"Yes": 0.8781456857601014, "No": 0.12185188855693108}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9015057302576085, "res": {"Yes": 0.9015057302576085, "No": 0.09849112858372988}, "ground_truth": 1}, {"key": "37139607", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.48209041477605624, "res": {"No": 0.5179024680854125, "Yes": 0.48209041477605624}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.045745671671933476, "res": {"No": 0.9542480431757308, "Yes": 0.045745671671933476}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.018488543666307436, "res": {"No": 0.9815083283235413, "Yes": 0.018488543666307436}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8856160716495063, "res": {"Yes": 0.8856160716495063, "No": 0.11438094255169788}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.48221104888853145, "res": {"No": 0.5177811584627897, "Yes": 0.48221104888853145}, "ground_truth": 1}, {"key": "37092824", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.27000340741711654, "res": {"No": 0.7299915647817165, "Yes": 0.27000340741711654}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7728103757472355, "res": {"Yes": 0.7728103757472355, "No": 0.227186548371329}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8837959630631425, "res": {"Yes": 0.8837959630631425, "No": 0.11620199105343257}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.0009982038939146886, "res": {"No": 0.9990015123208946, "Yes": 0.0009982038939146886}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4498755455110819, "res": {"No": 0.5501235222842009, "Yes": 0.4498755455110819}, "ground_truth": 1}, {"key": "32191802", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.004576816087525838, "res": {"No": 0.9954227850241921, "Yes": 0.004576816087525838}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.021920337941103898, "res": {"No": 0.9780792103980188, "Yes": 0.021920337941103898}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9082460017840602, "res": {"Yes": 0.9082460017840602, "No": 0.09175154068328979}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999582999628833, "res": {"Yes": 0.999582999628833, "No": 0.0004159331532158123}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9852644644698209, "res": {"Yes": 0.9852644644698209, "No": 0.014731989398846568}, "ground_truth": 1}, {"key": "39396038", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989452381527357, "res": {"Yes": 0.9989452381527357, "No": 0.0010538158073178175}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9895287641337212, "res": {"Yes": 0.9895287641337212, "No": 0.010469531520905106}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9943102666937856, "res": {"Yes": 0.9943102666937856, "No": 0.005689334484424933}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999741779333953, "res": {"Yes": 0.9999741779333953, "No": 2.5504695130084355e-05}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992796063082231, "res": {"Yes": 0.9992796063082231, "No": 0.0007185679391437279}, "ground_truth": 1}, {"key": "39076884", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997502544316179, "res": {"Yes": 0.9997502544316179, "No": 0.00024946722852422126}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996009883763198, "res": {"Yes": 0.9996009883763198, "No": 0.0003980502517387165}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9959217457582695, "res": {"Yes": 0.9959217457582695, "No": 0.004078124816562333}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9974427216216538, "res": {"Yes": 0.9974427216216538, "No": 0.0025571216717897955}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9808186224304161, "res": {"Yes": 0.9808186224304161, "No": 0.019180122935118865}, "ground_truth": 1}, {"key": "27763432", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9939470368422739, "res": {"Yes": 0.9939470368422739, "No": 0.0060524350518913195}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9927737701651821, "res": {"Yes": 0.9927737701651821, "No": 0.007225889054702546}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3832697230239605, "res": {"No": 0.6167278982794705, "Yes": 0.3832697230239605}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7794562794486601, "res": {"Yes": 0.7794562794486601, "No": 0.22053446333596513}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3939691272451913, "res": {"No": 0.6060273875240269, "Yes": 0.3939691272451913}, "ground_truth": 1}, {"key": "37806929", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8251735344326222, "res": {"Yes": 0.8251735344326222, "No": 0.17482181915662967}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7680753796999104, "res": {"Yes": 0.7680753796999104, "No": 0.23192197002236453}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9989232308324033, "res": {"Yes": 0.9989232308324033, "No": 0.0010765217898291105}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.983442472984003, "res": {"Yes": 0.983442472984003, "No": 0.016555465334197134}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995364298518593, "res": {"Yes": 0.9995364298518593, "No": 0.0004632356361367392}, "ground_truth": 1}, {"key": "32334186", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999231613822378, "res": {"Yes": 0.9999231613822378, "No": 7.64545585121952e-05}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9987826475753631, "res": {"Yes": 0.9987826475753631, "No": 0.0012162578137795122}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.09641493133428045, "res": {"No": 0.9035848995138349, "Yes": 0.09641493133428045}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.705489352455127, "res": {"Yes": 0.705489352455127, "No": 0.2945104772861193}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9633812425784545, "res": {"Yes": 0.9633812425784545, "No": 0.0366187087918883}, "ground_truth": 1}, {"key": "36187324", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9936446979055398, "res": {"Yes": 0.9936446979055398, "No": 0.006355135835386963}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984459992116134, "res": {"Yes": 0.9984459992116134, "No": 0.0015532014912385378}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9450457811504459, "res": {"Yes": 0.9450457811504459, "No": 0.05495373112904816}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9981019633540571, "res": {"Yes": 0.9981019633540571, "No": 0.001897540509580204}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992885365602201, "res": {"Yes": 0.9992885365602201, "No": 0.00071098302732508}, "ground_truth": 1}, {"key": "35306009", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997652594858669, "res": {"Yes": 0.9997652594858669, "No": 0.0002341384385051176}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9989446426816567, "res": {"Yes": 0.9989446426816567, "No": 0.0010550219569455672}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9992888939558291, "res": {"Yes": 0.9992888939558291, "No": 0.000711054129182846}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997601349322264, "res": {"Yes": 0.9997601349322264, "No": 0.0002397142425639051}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9942216386222371, "res": {"Yes": 0.9942216386222371, "No": 0.005777268418266841}, "ground_truth": 1}, {"key": "39490050", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.992911020697708, "res": {"Yes": 0.992911020697708, "No": 0.0070873228850796555}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996753152215149, "res": {"Yes": 0.9996753152215149, "No": 0.00032452791528127635}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999375840279578, "res": {"Yes": 0.9999375840279578, "No": 6.227173045004988e-05}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6973587254215202, "res": {"Yes": 0.6973587254215202, "No": 0.30263918246676863}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9876844310748246, "res": {"Yes": 0.9876844310748246, "No": 0.0123130820562159}, "ground_truth": 1}, {"key": "38072149", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.99761115165044, "res": {"Yes": 0.99761115165044, "No": 0.0023881069452775256}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988908832251784, "res": {"Yes": 0.9988908832251784, "No": 0.001108647472353242}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.1291230568825244, "res": {"No": 0.8708755796823339, "Yes": 0.1291230568825244}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8626961462410959, "res": {"Yes": 0.8626961462410959, "No": 0.13729421515225712}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3489777892229089, "res": {"No": 0.6510170478128052, "Yes": 0.3489777892229089}, "ground_truth": 1}, {"key": "35899689", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8684511424311946, "res": {"Yes": 0.8684511424311946, "No": 0.13154586564524576}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.07696680915440328, "res": {"No": 0.9230299190492826, "Yes": 0.07696680915440328}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0006673936541553772, "res": {"No": 0.9993323439115818, "Yes": 0.0006673936541553772}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992137913241281, "res": {"Yes": 0.9992137913241281, "No": 0.0007857881744589873}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9979219684034569, "res": {"Yes": 0.9979219684034569, "No": 0.0020772840161180114}, "ground_truth": 1}, {"key": "27994518", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.982012279621149, "res": {"Yes": 0.982012279621149, "No": 0.01798638852859217}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9938767400386047, "res": {"Yes": 0.9938767400386047, "No": 0.006122880030091057}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.06933854656044254, "res": {"No": 0.930660118303108, "Yes": 0.06933854656044254}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999396103605277, "res": {"Yes": 0.9999396103605277, "No": 6.0313596422765285e-05}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996672120162093, "res": {"Yes": 0.9996672120162093, "No": 0.00033265488060221554}, "ground_truth": 1}, {"key": "10615479", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998681023692575, "res": {"Yes": 0.9998681023692575, "No": 0.00013161507420529053}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.793529002173934, "res": {"Yes": 0.793529002173934, "No": 0.2064689171885464}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9950613534159275, "res": {"Yes": 0.9950613534159275, "No": 0.004938285859509927}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998273446066582, "res": {"Yes": 0.9998273446066582, "No": 0.00017220894877265856}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980929356624362, "res": {"Yes": 0.9980929356624362, "No": 0.0019061713070656304}, "ground_truth": 1}, {"key": "40186667", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998998892342964, "res": {"Yes": 0.998998892342964, "No": 0.0010007175362882225}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9837557109317797, "res": {"Yes": 0.9837557109317797, "No": 0.016243279905765254}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.005079108626562628, "res": {"No": 0.9949204343483489, "Yes": 0.005079108626562628}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8515043502219164, "res": {"Yes": 0.8515043502219164, "No": 0.14849118244159099}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9845297184699981, "res": {"Yes": 0.9845297184699981, "No": 0.0154702106161578}, "ground_truth": 1}, {"key": "38622886", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994081811938751, "res": {"Yes": 0.9994081811938751, "No": 0.0005893389929847485}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992218871869053, "res": {"Yes": 0.9992218871869053, "No": 0.0007776624475338969}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.08073481371619583, "res": {"No": 0.9192641738418662, "Yes": 0.08073481371619583}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.23632589866785927, "res": {"No": 0.7636700460493963, "Yes": 0.23632589866785927}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980620609334907, "res": {"Yes": 0.9980620609334907, "No": 0.0019375108437078398}, "ground_truth": 1}, {"key": "40686943", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998968674781786, "res": {"Yes": 0.998968674781786, "No": 0.0010307526659118131}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9900191406999975, "res": {"Yes": 0.9900191406999975, "No": 0.009979462977263558}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9971500977036599, "res": {"Yes": 0.9971500977036599, "No": 0.0028497614213859757}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.05028659693041088, "res": {"No": 0.9497112385629457, "Yes": 0.05028659693041088}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.04693642746492876, "res": {"No": 0.9530631834479457, "Yes": 0.04693642746492876}, "ground_truth": 1}, {"key": "30604567", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7285363409245962, "res": {"Yes": 0.7285363409245962, "No": 0.27146260062974703}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.7973168546805198, "res": {"Yes": 0.7973168546805198, "No": 0.2026820467488635}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9998068489760613, "res": {"Yes": 0.9998068489760613, "No": 0.00019303153280413415}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999003954908585, "res": {"Yes": 0.9999003954908585, "No": 9.949521553810707e-05}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998496284069415, "res": {"Yes": 0.9998496284069415, "No": 0.00015003019261844238}, "ground_truth": 1}, {"key": "35440903", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999859282501636, "res": {"Yes": 0.999859282501636, "No": 0.00014061512636305378}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.998589809654181, "res": {"Yes": 0.998589809654181, "No": 0.0014100793494074614}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9913131139382203, "res": {"Yes": 0.9913131139382203, "No": 0.00868637997624748}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990901426314592, "res": {"Yes": 0.9990901426314592, "No": 0.0009097673049487384}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9969990000297393, "res": {"Yes": 0.9969990000297393, "No": 0.0030003560920740043}, "ground_truth": 1}, {"key": "37219533", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998860315334429, "res": {"Yes": 0.998860315334429, "No": 0.0011392803361481474}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9964736268098854, "res": {"Yes": 0.9964736268098854, "No": 0.003526229885086371}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9954881166658621, "res": {"Yes": 0.9954881166658621, "No": 0.0045112793322756835}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9710560319003868, "res": {"Yes": 0.9710560319003868, "No": 0.02894007402221312}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.99768211046422, "res": {"Yes": 0.99768211046422, "No": 0.0023152738608901006}, "ground_truth": 1}, {"key": "40178965", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997285687141387, "res": {"Yes": 0.9997285687141387, "No": 0.00027107256646385246}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9958957336178991, "res": {"Yes": 0.9958957336178991, "No": 0.004103202962056899}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9974991727916662, "res": {"Yes": 0.9974991727916662, "No": 0.002500544677095967}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9311649707818908, "res": {"Yes": 0.9311649707818908, "No": 0.06883310310336885}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9963266421468342, "res": {"Yes": 0.9963266421468342, "No": 0.0036720506968041}, "ground_truth": 1}, {"key": "13750468", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995195145701135, "res": {"Yes": 0.9995195145701135, "No": 0.0004803465670029486}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.98601547083556, "res": {"Yes": 0.98601547083556, "No": 0.013983223351172008}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9634843636084351, "res": {"Yes": 0.9634843636084351, "No": 0.03651452325998818}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997233288405262, "res": {"Yes": 0.9997233288405262, "No": 0.00027663599871608125}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9967118508421509, "res": {"Yes": 0.9967118508421509, "No": 0.0032874930353671387}, "ground_truth": 1}, {"key": "17754949", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9976427114786547, "res": {"Yes": 0.9976427114786547, "No": 0.002357039727636137}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998037502994923, "res": {"Yes": 0.9998037502994923, "No": 0.00019609839684237606}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9146190675583907, "res": {"Yes": 0.9146190675583907, "No": 0.08538037547238077}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.297148578785306, "res": {"No": 0.7028507599248968, "Yes": 0.297148578785306}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.21432125457846835, "res": {"No": 0.7856760355729175, "Yes": 0.21432125457846835}, "ground_truth": 1}, {"key": "36675623", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4540149962947877, "res": {"No": 0.5459841352380191, "Yes": 0.4540149962947877}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.2971461124623373, "res": {"No": 0.7028529739082775, "Yes": 0.2971461124623373}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.678948840243948, "res": {"Yes": 0.678948840243948, "No": 0.3210456673766797}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.00042354512373364773, "res": {"No": 0.9995754929286346, "Yes": 0.00042354512373364773}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8362413846119531, "res": {"Yes": 0.8362413846119531, "No": 0.16375800830225382}, "ground_truth": 1}, {"key": "40035440", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9984847378706702, "res": {"Yes": 0.9984847378706702, "No": 0.00151353546096745}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8004231129022616, "res": {"Yes": 0.8004231129022616, "No": 0.19957271955936734}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.06737569058064587, "res": {"No": 0.9326224802282804, "Yes": 0.06737569058064587}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.0016431239524754948, "res": {"No": 0.9983566369023398, "Yes": 0.0016431239524754948}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9952966498558159, "res": {"Yes": 0.9952966498558159, "No": 0.004702860680482031}, "ground_truth": 1}, {"key": "37685909", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9895849071355542, "res": {"Yes": 0.9895849071355542, "No": 0.010412648602941438}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9933677031130491, "res": {"Yes": 0.9933677031130491, "No": 0.006631603160614444}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9497967287682196, "res": {"Yes": 0.9497967287682196, "No": 0.05020066526908772}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.993275839027079, "res": {"Yes": 0.993275839027079, "No": 0.006720578781207617}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9972838159213023, "res": {"Yes": 0.9972838159213023, "No": 0.002714753830154607}, "ground_truth": 1}, {"key": "36938787", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998709048295994, "res": {"Yes": 0.998709048295994, "No": 0.0012895280245475095}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996700719782239, "res": {"Yes": 0.9996700719782239, "No": 0.00032956135993771074}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9995066615314605, "res": {"Yes": 0.9995066615314605, "No": 0.0004925893462992705}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.908452664881742, "res": {"Yes": 0.908452664881742, "No": 0.0915468880726219}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.997080398350736, "res": {"Yes": 0.997080398350736, "No": 0.0029192194794254627}, "ground_truth": 1}, {"key": "39398068", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.997793418288646, "res": {"Yes": 0.997793418288646, "No": 0.00220632068338713}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9660502572347512, "res": {"Yes": 0.9660502572347512, "No": 0.033948683613505434}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9910765325853428, "res": {"Yes": 0.9910765325853428, "No": 0.008923104096897365}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999797803764193, "res": {"Yes": 0.9999797803764193, "No": 2.0039464573374967e-05}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993236552243097, "res": {"Yes": 0.9993236552243097, "No": 0.0006762628676745941}, "ground_truth": 1}, {"key": "39926408", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998832320179115, "res": {"Yes": 0.9998832320179115, "No": 0.00011627493986887766}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998627389311626, "res": {"Yes": 0.9998627389311626, "No": 0.00013712015125918542}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9966522874273576, "res": {"Yes": 0.9966522874273576, "No": 0.0033475970132912087}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9940469246921838, "res": {"Yes": 0.9940469246921838, "No": 0.005952793344066262}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997502544316179, "res": {"Yes": 0.9997502544316179, "No": 0.0002492809460896651}, "ground_truth": 1}, {"key": "40465336", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995660872673711, "res": {"Yes": 0.9995660872673711, "No": 0.0004337554768670926}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5644802966928915, "res": {"Yes": 0.5644802966928915, "No": 0.43551819674146364}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9275036307063634, "res": {"Yes": 0.9275036307063634, "No": 0.0724846546155442}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.996864643428635, "res": {"Yes": 0.996864643428635, "No": 0.0031348322973385645}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9910603672678564, "res": {"Yes": 0.9910603672678564, "No": 0.008938357781633377}, "ground_truth": 1}, {"key": "34173549", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9970782808533425, "res": {"Yes": 0.9970782808533425, "No": 0.002921107365012172}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9785981564437302, "res": {"Yes": 0.9785981564437302, "No": 0.021399738000426532}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9993892575391485, "res": {"Yes": 0.9993892575391485, "No": 0.0006104383208903957}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8915507649520839, "res": {"Yes": 0.8915507649520839, "No": 0.10844740175449342}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9617181063499471, "res": {"Yes": 0.9617181063499471, "No": 0.03828148959555352}, "ground_truth": 1}, {"key": "33541535", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9982627897994956, "res": {"Yes": 0.9982627897994956, "No": 0.0017369240803823153}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9981337948303955, "res": {"Yes": 0.9981337948303955, "No": 0.0018659238250102077}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9575683927679036, "res": {"Yes": 0.9575683927679036, "No": 0.042427030842644514}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9980140995149281, "res": {"Yes": 0.9980140995149281, "No": 0.0019851484137613186}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9358590794335487, "res": {"Yes": 0.9358590794335487, "No": 0.0641387547158454}, "ground_truth": 1}, {"key": "35685195", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9962563535824307, "res": {"Yes": 0.9962563535824307, "No": 0.003742668572248169}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990437369511999, "res": {"Yes": 0.9990437369511999, "No": 0.0009545338040237187}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.007701474307066872, "res": {"No": 0.9922982575841941, "Yes": 0.007701474307066872}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.995053443008129, "res": {"Yes": 0.995053443008129, "No": 0.0049459772973329905}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980770258884174, "res": {"Yes": 0.9980770258884174, "No": 0.001922219059812933}, "ground_truth": 1}, {"key": "28440730", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.976839437323835, "res": {"Yes": 0.976839437323835, "No": 0.023159426247690275}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9859720141473604, "res": {"Yes": 0.9859720141473604, "No": 0.014027540544290973}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.2565488459365783, "res": {"No": 0.743448286229959, "Yes": 0.2565488459365783}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7826328301370729, "res": {"Yes": 0.7826328301370729, "No": 0.21736576312988984}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9159094435026733, "res": {"Yes": 0.9159094435026733, "No": 0.08409022074808785}, "ground_truth": 1}, {"key": "38338714", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9720280771325998, "res": {"Yes": 0.9720280771325998, "No": 0.027970748816382004}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.21552195398216203, "res": {"No": 0.784476635434637, "Yes": 0.21552195398216203}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5720515896348758, "res": {"Yes": 0.5720515896348758, "No": 0.42790293350390807}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9774860923487958, "res": {"Yes": 0.9774860923487958, "No": 0.022512958550077383}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9943799236501437, "res": {"Yes": 0.9943799236501437, "No": 0.00561827838048274}, "ground_truth": 1}, {"key": "32191881", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8715434140015306, "res": {"Yes": 0.8715434140015306, "No": 0.12843966731011108}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9871785921396994, "res": {"Yes": 0.9871785921396994, "No": 0.012817057218220664}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.004756263014802842, "res": {"No": 0.9952435140781114, "Yes": 0.004756263014802842}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.6446816177153596, "res": {"Yes": 0.6446816177153596, "No": 0.3553174015829929}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9886924207330076, "res": {"Yes": 0.9886924207330076, "No": 0.011307285799672159}, "ground_truth": 1}, {"key": "37707251", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9239799192407834, "res": {"Yes": 0.9239799192407834, "No": 0.07601898251111637}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9967942841149399, "res": {"Yes": 0.9967942841149399, "No": 0.0032053002860599317}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.3236259193909456, "res": {"No": 0.6763726144425939, "Yes": 0.3236259193909456}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.4892307594997276, "res": {"No": 0.5107475868572109, "Yes": 0.4892307594997276}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9975765084090268, "res": {"Yes": 0.9975765084090268, "No": 0.0024213307336732343}, "ground_truth": 1}, {"key": "40172567", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9276220990353037, "res": {"Yes": 0.9276220990353037, "No": 0.07237011797072994}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.976584472529721, "res": {"Yes": 0.976584472529721, "No": 0.023415136658455182}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9822619103873794, "res": {"Yes": 0.9822619103873794, "No": 0.01773732682069279}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.993806680161122, "res": {"Yes": 0.993806680161122, "No": 0.006192917367514624}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9960088937196564, "res": {"Yes": 0.9960088937196564, "No": 0.003990694512278167}, "ground_truth": 1}, {"key": "33113255", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9693632929785794, "res": {"Yes": 0.9693632929785794, "No": 0.030635408453189353}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8305148826342055, "res": {"Yes": 0.8305148826342055, "No": 0.1694815004510079}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9997102201442953, "res": {"Yes": 0.9997102201442953, "No": 0.0002893171693021054}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9756923289481901, "res": {"Yes": 0.9756923289481901, "No": 0.024306171249341216}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998094709629628, "res": {"Yes": 0.9998094709629628, "No": 0.00019035210816376752}, "ground_truth": 1}, {"key": "33022143", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993035346046923, "res": {"Yes": 0.9993035346046923, "No": 0.0006959240688925859}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9986267827268999, "res": {"Yes": 0.9986267827268999, "No": 0.0013730482648138256}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9519674499540903, "res": {"Yes": 0.9519674499540903, "No": 0.048030886800745166}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5860632266020819, "res": {"Yes": 0.5860632266020819, "No": 0.413935588746084}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9701032032899424, "res": {"Yes": 0.9701032032899424, "No": 0.02989470214711372}, "ground_truth": 1}, {"key": "32084473", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9926928212031969, "res": {"Yes": 0.9926928212031969, "No": 0.0073044465487257775}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.016248267358231108, "res": {"No": 0.9837430215487047, "Yes": 0.016248267358231108}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.07804424262157303, "res": {"No": 0.9219538738861954, "Yes": 0.07804424262157303}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7918350017463509, "res": {"Yes": 0.7918350017463509, "No": 0.20816034642389505}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8795106990106546, "res": {"Yes": 0.8795106990106546, "No": 0.12048795374136306}, "ground_truth": 1}, {"key": "40564245", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.856596576862662, "res": {"Yes": 0.856596576862662, "No": 0.14339485931924806}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.48669341116946535, "res": {"No": 0.5132120840729711, "Yes": 0.48669341116946535}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9971934821553035, "res": {"Yes": 0.9971934821553035, "No": 0.0028059166554668252}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.999446047928135, "res": {"Yes": 0.999446047928135, "No": 0.0005533750923649186}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993405598862675, "res": {"Yes": 0.9993405598862675, "No": 0.0006592315628356508}, "ground_truth": 1}, {"key": "31717213", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998825168816821, "res": {"Yes": 0.9998825168816821, "No": 0.0001172475554377759}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995978903177775, "res": {"Yes": 0.9995978903177775, "No": 0.0004017437943549457}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8010628023948179, "res": {"Yes": 0.8010628023948179, "No": 0.19892925897385183}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9965940165659363, "res": {"Yes": 0.9965940165659363, "No": 0.0034047481734038915}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9708566576671621, "res": {"Yes": 0.9708566576671621, "No": 0.029140824038838498}, "ground_truth": 1}, {"key": "34861894", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7634055260214478, "res": {"Yes": 0.7634055260214478, "No": 0.23658945436682016}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.6230371382581865, "res": {"Yes": 0.6230371382581865, "No": 0.3769581521311424}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9989052689557107, "res": {"Yes": 0.9989052689557107, "No": 0.0010940053332436875}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994366397470112, "res": {"Yes": 0.9994366397470112, "No": 0.0005628865837166233}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998971773206141, "res": {"Yes": 0.9998971773206141, "No": 0.00010258621407461338}, "ground_truth": 1}, {"key": "40838760", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997074829414598, "res": {"Yes": 0.9997074829414598, "No": 0.00029190475220110067}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9973828222968756, "res": {"Yes": 0.9973828222968756, "No": 0.0026148103709075273}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.663646434158352, "res": {"Yes": 0.663646434158352, "No": 0.3363504017738541}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.998969508221699, "res": {"Yes": 0.998969508221699, "No": 0.0010302580233558863}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.996641862199961, "res": {"Yes": 0.996641862199961, "No": 0.003358075288301346}, "ground_truth": 1}, {"key": "40044849", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998080829467403, "res": {"Yes": 0.998080829467403, "No": 0.0019190250660583706}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9866146720177486, "res": {"Yes": 0.9866146720177486, "No": 0.01338500805790388}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9908464937535932, "res": {"Yes": 0.9908464937535932, "No": 0.009153375139543531}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9695818877183798, "res": {"Yes": 0.9695818877183798, "No": 0.030417548008059347}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998079216094166, "res": {"Yes": 0.9998079216094166, "No": 0.00019190636254049823}, "ground_truth": 1}, {"key": "30296116", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9982740727284398, "res": {"Yes": 0.9982740727284398, "No": 0.0017258537903829402}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988638836693932, "res": {"Yes": 0.9988638836693932, "No": 0.0011357042907584262}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.16262323425164332, "res": {"No": 0.8373749163912132, "Yes": 0.16262323425164332}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8845491489461191, "res": {"Yes": 0.8845491489461191, "No": 0.11543602483623101}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991019221635093, "res": {"Yes": 0.9991019221635093, "No": 0.0008937688261090014}, "ground_truth": 1}, {"key": "34931360", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9765046624718973, "res": {"Yes": 0.9765046624718973, "No": 0.023484872230279716}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9952573288506364, "res": {"Yes": 0.9952573288506364, "No": 0.0047327469240649265}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9799514787723871, "res": {"Yes": 0.9799514787723871, "No": 0.020047845246645542}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998453414008744, "res": {"Yes": 0.9998453414008744, "No": 0.00015453839209057349}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999353192918872, "res": {"Yes": 0.9999353192918872, "No": 6.395652514750064e-05}, "ground_truth": 1}, {"key": "18862422", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9984250777936532, "res": {"Yes": 0.9984250777936532, "No": 0.0015748809450595862}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999680987188567, "res": {"Yes": 0.9999680987188567, "No": 3.119368149013089e-05}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9860906968252888, "res": {"Yes": 0.9860906968252888, "No": 0.013908797853030482}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9966355838743253, "res": {"Yes": 0.9966355838743253, "No": 0.003363937890608877}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980361836156548, "res": {"Yes": 0.9980361836156548, "No": 0.001962985009976411}, "ground_truth": 1}, {"key": "36361140", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990822934005053, "res": {"Yes": 0.9990822934005053, "No": 0.0009170216283491201}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994493837447982, "res": {"Yes": 0.9994493837447982, "No": 0.0005501503243951367}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.984081954799717, "res": {"Yes": 0.984081954799717, "No": 0.015917247647118864}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9942667723379371, "res": {"Yes": 0.9942667723379371, "No": 0.0057328969505715845}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9955373792159788, "res": {"Yes": 0.9955373792159788, "No": 0.004461766567526457}, "ground_truth": 1}, {"key": "39703329", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.934985469926277, "res": {"Yes": 0.934985469926277, "No": 0.06501105153002615}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9789670439408545, "res": {"Yes": 0.9789670439408545, "No": 0.021032534041955493}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9548620606917153, "res": {"Yes": 0.9548620606917153, "No": 0.045137170153442485}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.06068914058315017, "res": {"No": 0.9393091600810446, "Yes": 0.06068914058315017}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9887995216965049, "res": {"Yes": 0.9887995216965049, "No": 0.01119946802026263}, "ground_truth": 1}, {"key": "34033324", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9969353681007543, "res": {"Yes": 0.9969353681007543, "No": 0.003064137966152105}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5844209505928362, "res": {"Yes": 0.5844209505928362, "No": 0.41556739735789544}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5319315996463074, "res": {"Yes": 0.5319315996463074, "No": 0.46806008713118397}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7971881143496, "res": {"Yes": 0.7971881143496, "No": 0.2028032260190226}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9966977598282952, "res": {"Yes": 0.9966977598282952, "No": 0.0032998475782021865}, "ground_truth": 1}, {"key": "35658862", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999314843826759, "res": {"Yes": 0.999314843826759, "No": 0.0006847142226246845}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.764170994551837, "res": {"Yes": 0.764170994551837, "No": 0.2358269041639674}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7128582258960386, "res": {"Yes": 0.7128582258960386, "No": 0.2871398499069619}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.857595719442301, "res": {"Yes": 0.857595719442301, "No": 0.14239927091447332}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.997167646004634, "res": {"Yes": 0.997167646004634, "No": 0.00283124991147511}, "ground_truth": 1}, {"key": "36092657", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9914599283678694, "res": {"Yes": 0.9914599283678694, "No": 0.008536126034822643}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9991739195924446, "res": {"Yes": 0.9991739195924446, "No": 0.0008243964624642966}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.36998738815217985, "res": {"No": 0.6300111067437354, "Yes": 0.36998738815217985}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9979110465066579, "res": {"Yes": 0.9979110465066579, "No": 0.002088480522796304}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995420298203714, "res": {"Yes": 0.9995420298203714, "No": 0.00045743790922506426}, "ground_truth": 1}, {"key": "26333438", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9808105954436566, "res": {"Yes": 0.9808105954436566, "No": 0.019188968929091426}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9836691973563434, "res": {"Yes": 0.9836691973563434, "No": 0.016330495982288078}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999040904456155, "res": {"Yes": 0.9999040904456155, "No": 9.535049829256861e-05}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998566603941031, "res": {"Yes": 0.9998566603941031, "No": 0.0001427698021442094}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999937270200753, "res": {"Yes": 0.9999937270200753, "No": 6.0033314569588866e-06}, "ground_truth": 1}, {"key": "34184963", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999909853566321, "res": {"Yes": 0.9999909853566321, "No": 8.513478027414573e-06}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.99988680771673, "res": {"Yes": 0.99988680771673, "No": 0.00011299917953844712}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9960843562040207, "res": {"Yes": 0.9960843562040207, "No": 0.003915238624718595}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995095209541931, "res": {"Yes": 0.9995095209541931, "No": 0.0004898099986080047}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993840157962146, "res": {"Yes": 0.9993840157962146, "No": 0.0006145683539962057}, "ground_truth": 1}, {"key": "35069975", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999475965531086, "res": {"Yes": 0.9999475965531086, "No": 5.225562590984355e-05}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997741976971782, "res": {"Yes": 0.9997741976971782, "No": 0.00022469536645806587}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.5770772957543828, "res": {"Yes": 0.5770772957543828, "No": 0.422920906368356}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.05669163556671093, "res": {"No": 0.9433056157894429, "Yes": 0.05669163556671093}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994521203009242, "res": {"Yes": 0.9994521203009242, "No": 0.0005475786246047711}, "ground_truth": 1}, {"key": "36443950", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9581298858329809, "res": {"Yes": 0.9581298858329809, "No": 0.04186859733457744}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9979708806517579, "res": {"Yes": 0.9979708806517579, "No": 0.0020277458938384304}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9754745914033677, "res": {"Yes": 0.9754745914033677, "No": 0.024521720577618342}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9784109606942104, "res": {"Yes": 0.9784109606942104, "No": 0.021585834275826086}, "ground_truth": 1}, {"key": "29460858", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.05710046607038396, "res": {"No": 0.9428944468167083, "Yes": 0.05710046607038396}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.2634688326921009, "res": {"No": 0.7365273342902432, "Yes": 0.2634688326921009}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9505627189616689, "res": {"Yes": 0.9505627189616689, "No": 0.04943657223760066}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9961070664889714, "res": {"Yes": 0.9961070664889714, "No": 0.0038926909483753274}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9972451716229941, "res": {"Yes": 0.9972451716229941, "No": 0.0027538985959397327}, "ground_truth": 1}, {"key": "36155704", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9958006822965574, "res": {"Yes": 0.9958006822965574, "No": 0.0041984729631772974}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9970244756736635, "res": {"Yes": 0.9970244756736635, "No": 0.0029751643434931425}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.37644119218418687, "res": {"No": 0.6235560638134049, "Yes": 0.37644119218418687}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9931782365926061, "res": {"Yes": 0.9931782365926061, "No": 0.006821420120439014}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9943754451719287, "res": {"Yes": 0.9943754451719287, "No": 0.005624428140336274}, "ground_truth": 1}, {"key": "37185211", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9935363035409975, "res": {"Yes": 0.9935363035409975, "No": 0.006463579580654901}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9974953788107778, "res": {"Yes": 0.9974953788107778, "No": 0.002504076437630341}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.11064742326647689, "res": {"No": 0.8893489329235148, "Yes": 0.11064742326647689}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9600626828657838, "res": {"Yes": 0.9600626828657838, "No": 0.03993320083351114}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9854630694631995, "res": {"Yes": 0.9854630694631995, "No": 0.014535600961581093}, "ground_truth": 1}, {"key": "36454885", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7637265062629267, "res": {"Yes": 0.7637265062629267, "No": 0.23626403664568002}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9899419103392799, "res": {"Yes": 0.9899419103392799, "No": 0.010056531048194373}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9783207035111654, "res": {"Yes": 0.9783207035111654, "No": 0.021678491176769635}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9325771791915611, "res": {"Yes": 0.9325771791915611, "No": 0.06742179131765773}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9941580181285045, "res": {"Yes": 0.9941580181285045, "No": 0.005841540106749691}, "ground_truth": 1}, {"key": "33148906", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9772758743155682, "res": {"Yes": 0.9772758743155682, "No": 0.02272275349297295}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9516787582015442, "res": {"Yes": 0.9516787582015442, "No": 0.048318575806170425}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.12787266690486965, "res": {"No": 0.8721127264294314, "Yes": 0.12787266690486965}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9870286397490343, "res": {"Yes": 0.9870286397490343, "No": 0.01296894014338557}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9832079115770739, "res": {"Yes": 0.9832079115770739, "No": 0.016791524733746108}, "ground_truth": 1}, {"key": "18086604", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9748728565753779, "res": {"Yes": 0.9748728565753779, "No": 0.02511886805254378}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9885896505088063, "res": {"Yes": 0.9885896505088063, "No": 0.011408096002262672}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9640390026592008, "res": {"Yes": 0.9640390026592008, "No": 0.035960469977929836}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9785536351547826, "res": {"Yes": 0.9785536351547826, "No": 0.02144583553520662}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.06817869179328165, "res": {"No": 0.9318180524948292, "Yes": 0.06817869179328165}, "ground_truth": 1}, {"key": "33693397", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8560630833957469, "res": {"Yes": 0.8560630833957469, "No": 0.14393614719554723}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.286576575301678, "res": {"No": 0.7134193091866211, "Yes": 0.286576575301678}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.564373732872817, "res": {"Yes": 0.564373732872817, "No": 0.43562539095938924}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9986878869740339, "res": {"Yes": 0.9986878869740339, "No": 0.0013115118804829199}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999888714767661, "res": {"Yes": 0.999888714767661, "No": 0.00011109609616109476}, "ground_truth": 1}, {"key": "39501530", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9987746890073005, "res": {"Yes": 0.9987746890073005, "No": 0.001224469732659059}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.997078875112175, "res": {"Yes": 0.997078875112175, "No": 0.0029207524720275095}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9986386685534636, "res": {"Yes": 0.9986386685534636, "No": 0.00136131926722218}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9980113669560645, "res": {"Yes": 0.9980113669560645, "No": 0.00198856103459659}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999114803880921, "res": {"Yes": 0.9999114803880921, "No": 8.826322632585222e-05}, "ground_truth": 1}, {"key": "30948874", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994802263291609, "res": {"Yes": 0.9994802263291609, "No": 0.0005195227272844099}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993385347246748, "res": {"Yes": 0.9993385347246748, "No": 0.0006612574554980839}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9978769766088974, "res": {"Yes": 0.9978769766088974, "No": 0.00212288344256189}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8213239151554008, "res": {"Yes": 0.8213239151554008, "No": 0.17867576220703693}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9985904047140258, "res": {"Yes": 0.9985904047140258, "No": 0.0014091389991621687}, "ground_truth": 1}, {"key": "39410675", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9135905352264727, "res": {"Yes": 0.9135905352264727, "No": 0.08640726681964879}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.8480642326578809, "res": {"Yes": 0.8480642326578809, "No": 0.15193416149967792}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 6.573284016808228e-06, "res": {"No": 0.999992773397112, "Yes": 6.573284016808228e-06}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9950833106820056, "res": {"Yes": 0.9950833106820056, "No": 0.004914791241690976}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990834843572629, "res": {"Yes": 0.9990834843572629, "No": 0.000915299704883109}, "ground_truth": 1}, {"key": "32903337", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999674242730425, "res": {"Yes": 0.999674242730425, "No": 0.0003251086902518974}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994156829797197, "res": {"Yes": 0.9994156829797197, "No": 0.0005840882929531331}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.4407849121782459, "res": {"No": 0.5592081017832599, "Yes": 0.4407849121782459}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9980947202542005, "res": {"Yes": 0.9980947202542005, "No": 0.0019049174589068655}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9924828227732807, "res": {"Yes": 0.9924828227732807, "No": 0.007516005993493169}, "ground_truth": 1}, {"key": "27685132", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9983072114854469, "res": {"Yes": 0.9983072114854469, "No": 0.001692626185957225}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9831808383367667, "res": {"Yes": 0.9831808383367667, "No": 0.016818182267263983}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.22864154670923617, "res": {"No": 0.7713569518418596, "Yes": 0.22864154670923617}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.8464472201771701, "res": {"Yes": 0.8464472201771701, "No": 0.15354853085526252}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.910518774534642, "res": {"Yes": 0.910518774534642, "No": 0.08947144096376654}, "ground_truth": 1}, {"key": "22791471", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8603006136993832, "res": {"Yes": 0.8603006136993832, "No": 0.1396905863140601}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 3.022591164398001e-05, "res": {"No": 0.9999696483206215, "Yes": 3.022591164398001e-05}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9551414731966911, "res": {"Yes": 0.9551414731966911, "No": 0.04485818544476849}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9856573716744951, "res": {"Yes": 0.9856573716744951, "No": 0.014342200553071208}, "ground_truth": 1}, {"key": "32292348", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9900261530304053, "res": {"Yes": 0.9900261530304053, "No": 0.009973177895596484}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9412852409354906, "res": {"Yes": 0.9412852409354906, "No": 0.058713863768007524}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9996601850501834, "res": {"Yes": 0.9996601850501834, "No": 0.00033951263335784353}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999372264343427, "res": {"Yes": 0.9999372264343427, "No": 6.265218505848418e-05}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999753699393249, "res": {"Yes": 0.9999753699393249, "No": 2.4309593288259257e-05}, "ground_truth": 1}, {"key": "20482930", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999881244990143, "res": {"Yes": 0.9999881244990143, "No": 1.1504629941608837e-05}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999974535534225, "res": {"Yes": 0.999974535534225, "No": 2.4896508131756087e-05}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.009549284965644321, "res": {"No": 0.9904501195210228, "Yes": 0.009549284965644321}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.997197992172464, "res": {"Yes": 0.997197992172464, "No": 0.0028019933622584975}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9310219362058464, "res": {"Yes": 0.9310219362058464, "No": 0.06897576968795878}, "ground_truth": 1}, {"key": "11635754", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9944548914857221, "res": {"Yes": 0.9944548914857221, "No": 0.0055447968248294064}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997205879028329, "res": {"Yes": 0.9997205879028329, "No": 0.0002790537897283931}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.003616621414000441, "res": {"No": 0.9963829642904065, "Yes": 0.003616621414000441}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.7892973892112769, "res": {"Yes": 0.7892973892112769, "No": 0.21069811596526247}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9935607817951517, "res": {"Yes": 0.9935607817951517, "No": 0.006438462561843778}, "ground_truth": 1}, {"key": "40029096", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9949651615043508, "res": {"Yes": 0.9949651615043508, "No": 0.0050327410647897815}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9744673109794203, "res": {"Yes": 0.9744673109794203, "No": 0.025530785001583293}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9999675027220479, "res": {"Yes": 0.9999675027220479, "No": 3.229724905301579e-05}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.951497846991941, "res": {"Yes": 0.951497846991941, "No": 0.048501793613541566}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997868268346288, "res": {"Yes": 0.9997868268346288, "No": 0.00021297282128442718}, "ground_truth": 1}, {"key": "40414719", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.99984355362901, "res": {"Yes": 0.99984355362901, "No": 0.0001560659318402912}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.999722375444831, "res": {"Yes": 0.999722375444831, "No": 0.0002772219802391735}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7583457217689636, "res": {"Yes": 0.7583457217689636, "No": 0.24165250850701078}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9837506347654078, "res": {"Yes": 0.9837506347654078, "No": 0.016247219378784195}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.761743434593649, "res": {"Yes": 0.761743434593649, "No": 0.2382446719432718}, "ground_truth": 1}, {"key": "39537616", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7691629371967084, "res": {"Yes": 0.7691629371967084, "No": 0.23082655376296374}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.13715456190410538, "res": {"No": 0.862845034561512, "Yes": 0.13715456190410538}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 5.974793627940585e-06, "res": {"No": 0.9999933694113825, "Yes": 5.974793627940585e-06}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9955588825578311, "res": {"Yes": 0.9955588825578311, "No": 0.0044401816109828855}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9517881447339348, "res": {"Yes": 0.9517881447339348, "No": 0.0482090556025698}, "ground_truth": 1}, {"key": "33245830", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986461571731892, "res": {"Yes": 0.9986461571731892, "No": 0.0013536400253421842}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.0009151777035640167, "res": {"No": 0.999083722538794, "Yes": 0.0009151777035640167}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.008497725835908979, "res": {"No": 0.9915016469049647, "Yes": 0.008497725835908979}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9598352863115819, "res": {"Yes": 0.9598352863115819, "No": 0.040164329625892746}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9941694480289436, "res": {"Yes": 0.9941694480289436, "No": 0.005829141762530064}, "ground_truth": 1}, {"key": "39243601", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9847447026807453, "res": {"Yes": 0.9847447026807453, "No": 0.015254923127403697}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9680622102339219, "res": {"Yes": 0.9680622102339219, "No": 0.03193741731450125}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9828546042485956, "res": {"Yes": 0.9828546042485956, "No": 0.01713668143133085}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9986009807411479, "res": {"Yes": 0.9986009807411479, "No": 0.0013967269113895737}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9974615720707957, "res": {"Yes": 0.9974615720707957, "No": 0.0025371154319779486}, "ground_truth": 1}, {"key": "35815905", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8397337682006318, "res": {"Yes": 0.8397337682006318, "No": 0.16025682410010747}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.19964234266551348, "res": {"No": 0.8003542394567189, "Yes": 0.19964234266551348}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0010063849765911486, "res": {"No": 0.9989929455200578, "Yes": 0.0010063849765911486}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.09447891415638926, "res": {"No": 0.9055192526365955, "Yes": 0.09447891415638926}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.014562191972251441, "res": {"No": 0.9854373768049833, "Yes": 0.014562191972251441}, "ground_truth": 1}, {"key": "35260212", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9969500605440064, "res": {"Yes": 0.9969500605440064, "No": 0.003049315926232314}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.912536691017151, "res": {"Yes": 0.912536691017151, "No": 0.08746131479583197}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9837018311232752, "res": {"Yes": 0.9837018311232752, "No": 0.016297932821153254}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9914011018382731, "res": {"Yes": 0.9914011018382731, "No": 0.008598791576123439}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999908977336814, "res": {"Yes": 0.999908977336814, "No": 9.090105051744865e-05}, "ground_truth": 1}, {"key": "39193924", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999797314573467, "res": {"Yes": 0.999797314573467, "No": 0.00020257142855674524}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999921773835968, "res": {"Yes": 0.9999921773835968, "No": 7.714661104074236e-06}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.015824925795987738, "res": {"No": 0.9841721136296394, "Yes": 0.015824925795987738}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.522437144493294, "res": {"Yes": 0.522437144493294, "No": 0.4775553068045249}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5039576511183211, "res": {"Yes": 0.5039576511183211, "No": 0.4960385368565643}, "ground_truth": 1}, {"key": "40658569", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.702012450049741, "res": {"Yes": 0.702012450049741, "No": 0.2979819395053727}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.5014875988507747, "res": {"Yes": 0.5014875988507747, "No": 0.4985083198251787}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.28711596086524754, "res": {"No": 0.7128831906282393, "Yes": 0.28711596086524754}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9851758360356042, "res": {"Yes": 0.9851758360356042, "No": 0.014823003712426959}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9981498207956331, "res": {"Yes": 0.9981498207956331, "No": 0.0018497662485687603}, "ground_truth": 1}, {"key": "33497596", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9985991952441905, "res": {"Yes": 0.9985991952441905, "No": 0.0013999944593162579}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9701425786378354, "res": {"Yes": 0.9701425786378354, "No": 0.029854431237310648}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.0389258626366848, "res": {"No": 0.9610647178524734, "Yes": 0.0389258626366848}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.008068382100573764, "res": {"No": 0.9919218450825732, "Yes": 0.008068382100573764}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00042914242548353554, "res": {"No": 0.9995666829789496, "Yes": 0.00042914242548353554}, "ground_truth": 1}, {"key": "40339241", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.39017617932660187, "res": {"No": 0.6098189311860363, "Yes": 0.39017617932660187}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.13997086292465005, "res": {"No": 0.8600199520031816, "Yes": 0.13997086292465005}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.8433976365179177, "res": {"Yes": 0.8433976365179177, "No": 0.1566013930298188}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996251663376968, "res": {"Yes": 0.9996251663376968, "No": 0.00037471230990829035}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987683862595123, "res": {"Yes": 0.9987683862595123, "No": 0.0012315546064177601}, "ground_truth": 1}, {"key": "31792608", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994826054947233, "res": {"Yes": 0.9994826054947233, "No": 0.0005172025400098679}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995567971134283, "res": {"Yes": 0.9995567971134283, "No": 0.0004430510311872101}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9984780835911565, "res": {"Yes": 0.9984780835911565, "No": 0.0015216066435835656}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993088914256195, "res": {"Yes": 0.9993088914256195, "No": 0.0006909652672027965}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9986513912911447, "res": {"Yes": 0.9986513912911447, "No": 0.0013484830297527668}, "ground_truth": 1}, {"key": "33132662", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9981244100213229, "res": {"Yes": 0.9981244100213229, "No": 0.0018754830988997459}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9641315191730232, "res": {"Yes": 0.9641315191730232, "No": 0.03586814511835987}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.7903260319396129, "res": {"Yes": 0.7903260319396129, "No": 0.20967293808960102}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9984111824091696, "res": {"Yes": 0.9984111824091696, "No": 0.0015877975685612662}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994046108445075, "res": {"Yes": 0.9994046108445075, "No": 0.0005943239600391012}, "ground_truth": 1}, {"key": "37577457", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9959303754575847, "res": {"Yes": 0.9959303754575847, "No": 0.00406951887111767}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9892811269605978, "res": {"Yes": 0.9892811269605978, "No": 0.010717787870473046}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.605859220080002, "res": {"Yes": 0.605859220080002, "No": 0.3941213193298897}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.576509650271667, "res": {"Yes": 0.576509650271667, "No": 0.42348598021799133}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9615961730330833, "res": {"Yes": 0.9615961730330833, "No": 0.03839904459640226}, "ground_truth": 1}, {"key": "38701278", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8229074410003017, "res": {"Yes": 0.8229074410003017, "No": 0.17707772827618215}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.23446048799112196, "res": {"No": 0.7654683731668606, "Yes": 0.23446048799112196}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9954955595601389, "res": {"Yes": 0.9954955595601389, "No": 0.004503576140149377}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989388152551866, "res": {"Yes": 0.9989388152551866, "No": 0.001060054136492038}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9608742709967526, "res": {"Yes": 0.9608742709967526, "No": 0.03912267722246839}, "ground_truth": 1}, {"key": "34570783", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9826565848934931, "res": {"Yes": 0.9826565848934931, "No": 0.017339883954688027}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9951714802628524, "res": {"Yes": 0.9951714802628524, "No": 0.004828381309962724}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9847726693350467, "res": {"Yes": 0.9847726693350467, "No": 0.015227032146112105}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9973637320736642, "res": {"Yes": 0.9973637320736642, "No": 0.002635921876290894}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9907821324374658, "res": {"Yes": 0.9907821324374658, "No": 0.009217356464880023}, "ground_truth": 1}, {"key": "39064526", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994466435881626, "res": {"Yes": 0.9994466435881626, "No": 0.0005530609198676888}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9823279392699066, "res": {"Yes": 0.9823279392699066, "No": 0.017671049499300862}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.08041826113839552, "res": {"No": 0.9195801976324364, "Yes": 0.08041826113839552}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9281879262154192, "res": {"Yes": 0.9281879262154192, "No": 0.07180936354073071}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7384712190082481, "res": {"Yes": 0.7384712190082481, "No": 0.2615211811750553}, "ground_truth": 1}, {"key": "40741545", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9399008359059645, "res": {"Yes": 0.9399008359059645, "No": 0.06009845169014691}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.34749642562549143, "res": {"No": 0.6524960457218827, "Yes": 0.34749642562549143}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9905045125732972, "res": {"Yes": 0.9905045125732972, "No": 0.009493835364577976}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991069242297592, "res": {"Yes": 0.9991069242297592, "No": 0.0008928562181157824}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993604393061839, "res": {"Yes": 0.9993604393061839, "No": 0.0006392931788278758}, "ground_truth": 1}, {"key": "36929751", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990214966469309, "res": {"Yes": 0.9990214966469309, "No": 0.0009783564363316133}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997590623701338, "res": {"Yes": 0.9997590623701338, "No": 0.00024040080661624788}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9937757136274292, "res": {"Yes": 0.9937757136274292, "No": 0.006224057211930982}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.5644892324867147, "res": {"Yes": 0.5644892324867147, "No": 0.4355084847939649}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995230889582407, "res": {"Yes": 0.9995230889582407, "No": 0.0004767558704895186}, "ground_truth": 1}, {"key": "23984730", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9922651491128832, "res": {"Yes": 0.9922651491128832, "No": 0.007734545156366907}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9965015688203701, "res": {"Yes": 0.9965015688203701, "No": 0.0034975379530635935}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.9878558734008674, "res": {"Yes": 0.9878558734008674, "No": 0.01214350281452358}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9256061581323168, "res": {"Yes": 0.9256061581323168, "No": 0.07439351536605966}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9579517630512504, "res": {"Yes": 0.9579517630512504, "No": 0.04204357073383554}, "ground_truth": 1}, {"key": "36007415", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9975399785244459, "res": {"Yes": 0.9975399785244459, "No": 0.002459747442398537}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.43565771556262634, "res": {"No": 0.5643381220138071, "Yes": 0.43565771556262634}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_2_ft_gpt35", "target_model": "human", "recognition_score": 0.1711663822361093, "res": {"No": 0.8288286583083332, "Yes": 0.1711663822361093}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_2_ft_gpt35", "target_model": "claude", "recognition_score": 0.9659887507729521, "res": {"Yes": 0.9659887507729521, "No": 0.0340039358762362}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_2_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987920458646594, "res": {"Yes": 0.9987920458646594, "No": 0.0012056401599909116}, "ground_truth": 1}, {"key": "38875041", "model": "cnn_2_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9987692196322014, "res": {"Yes": 0.9987692196322014, "No": 0.0012296348790084488}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_2_ft_gpt35", "target_model": "llama", "recognition_score": 0.9656480322617813, "res": {"Yes": 0.9656480322617813, "No": 0.034304442988723746}, "ground_truth": 0}]