[{"key": "33773576", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998632156758288, "res": {"Yes": 0.9998632156758288, "No": 0.00013617414682470108}, "ground_truth": 0}, {"key": "33773576", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9973534143992242, "res": {"Yes": 0.9973534143992242, "No": 0.0026462612082558314}, "ground_truth": 1}, {"key": "33773576", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999983237218497, "res": {"Yes": 0.999983237218497, "No": 1.636129620162531e-05}, "ground_truth": 0}, {"key": "33773576", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999827604126034, "res": {"Yes": 0.9999827604126034, "No": 1.6937524717324282e-05}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.756288163143569e-07, "res": {"No": 0.9999989719621284, "Yes": 6.756288163143569e-07}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 2.860815290906044e-07}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999901509395023, "res": {"Yes": 0.9999901509395023, "No": 9.543244843398645e-06}, "ground_truth": 1}, {"key": "37642631", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9226322619102371, "res": {"Yes": 0.9226322619102371, "No": 0.07736687976337461}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999978991308068, "res": {"Yes": 0.9999978991308068, "No": 1.768892346865308e-06}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.717760823789893e-06, "res": {"No": 0.999995276659155, "Yes": 3.717760823789893e-06}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0448055931614583, "res": {"No": 0.955194223296265, "Yes": 0.0448055931614583}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9481876189727204, "res": {"Yes": 0.9481876189727204, "No": 0.05181188582275338}, "ground_truth": 1}, {"key": "36609836", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8784489442540142, "res": {"Yes": 0.8784489442540142, "No": 0.12155084820560104}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999807339855921, "res": {"Yes": 0.9999807339855921, "No": 1.9064492203905454e-05}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.008376202747000619, "res": {"No": 0.9916234261535167, "Yes": 0.008376202747000619}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0001457186281727176, "res": {"No": 0.9998537999282723, "Yes": 0.0001457186281727176}, "ground_truth": 1}, {"key": "41035610", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0005917785878786831, "res": {"No": 0.999407942934993, "Yes": 0.0005917785878786831}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.1803753309407617e-05, "res": {"No": 0.9999876476902904, "Yes": 1.1803753309407617e-05}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9873391742393611, "res": {"Yes": 0.9873391742393611, "No": 0.01266042110729237}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9922585803393388, "res": {"Yes": 0.9922585803393388, "No": 0.0077408985994438986}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996150415555235, "res": {"Yes": 0.9996150415555235, "No": 0.00038440095364689454}, "ground_truth": 1}, {"key": "37592684", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9960750089922792, "res": {"Yes": 0.9960750089922792, "No": 0.0039246386330461696}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.133534741372111, "res": {"No": 0.8664648553223836, "Yes": 0.133534741372111}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00021722725377298427, "res": {"No": 0.9997824209237612, "Yes": 0.00021722725377298427}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.007024688544834775, "res": {"No": 0.9929750729712794, "Yes": 0.007024688544834775}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.222510652971141, "res": {"No": 0.7774891966571582, "Yes": 0.222510652971141}, "ground_truth": 1}, {"key": "38951040", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.16227418084802672, "res": {"No": 0.8377256321879446, "Yes": 0.16227418084802672}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9829670059965037, "res": {"Yes": 0.9829670059965037, "No": 0.017032857606481464}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.05960689641165231, "res": {"No": 0.9403922570756522, "Yes": 0.05960689641165231}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9982187090851926, "res": {"Yes": 0.9982187090851926, "No": 0.0017809470599823181}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, " Yes": 3.585466714587718e-07}, "ground_truth": 1}, {"key": "40774469", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 4.456308135626758e-07}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998338996861849, "res": {"Yes": 0.9998338996861849, "No": 0.00016574799922696928}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 5.154656897172034e-06, "res": {"No": 0.9999944422379444, "Yes": 5.154656897172034e-06}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0006644778591032638, "res": {"No": 0.9993348455133894, "Yes": 0.0006644778591032638}, "ground_truth": 1}, {"key": "40876288", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.18978764305690488, "res": {"No": 0.8102113090235423, "Yes": 0.18978764305690488}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0033716845265352674, "res": {"No": 0.9966277719762442, "Yes": 0.0033716845265352674}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.4367531208331228e-05, "res": {"No": 0.999975489140396, "Yes": 2.4367531208331228e-05}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0018111486893500597, "res": {"No": 0.9981885368833847, "Yes": 0.0018111486893500597}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.007578784866713249, "res": {"No": 0.9924202363979622, "Yes": 0.007578784866713249}, "ground_truth": 1}, {"key": "40340131", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.11049058116313427, "res": {"No": 0.8895087721821769, "Yes": 0.11049058116313427}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.3069244048469851, "res": {"No": 0.6930752082967386, "Yes": 0.3069244048469851}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.558943019975452e-05, "res": {"No": 0.999934246531854, "Yes": 6.558943019975452e-05}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991442921269761, "res": {"Yes": 0.9991442921269761, "No": 0.0008549137254716206}, "ground_truth": 1}, {"key": "30121591", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.002262179839062552, "res": {"No": 0.9977372853070635, "Yes": 0.002262179839062552}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 8.346619094144959e-06, "res": {"No": 0.9999913429644723, "Yes": 8.346619094144959e-06}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.628505231125158e-06, "res": {"No": 0.9999965878943212, "Yes": 1.628505231125158e-06}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00015647567365034533, "res": {"No": 0.9998428385111608, "Yes": 0.00015647567365034533}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.001675074394608112, "res": {"No": 0.9983206367112666, "Yes": 0.001675074394608112}, "ground_truth": 1}, {"key": "35623366", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.08487028898288879, "res": {"No": 0.9151291006983417, "Yes": 0.08487028898288879}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0007586775546630973, "res": {"No": 0.9992385445544495, "Yes": 0.0007586775546630973}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0003096252074967343, "res": {"No": 0.9996898497565339, "Yes": 0.0003096252074967343}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9321199880875061, "res": {"Yes": 0.9321199880875061, "No": 0.0678797175258494}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997092704700228, "res": {"Yes": 0.9997092704700228, "No": 0.0002905011566781083}, "ground_truth": 1}, {"key": "41014093", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9959734214945819, "res": {"Yes": 0.9959734214945819, "No": 0.004026120587609924}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999691715222073, "res": {"Yes": 0.9999691715222073, "No": 3.065217302661805e-05}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8806752202430694, "res": {"Yes": 0.8806752202430694, "No": 0.1193242740396687}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6226929990878485, "res": {"Yes": 0.6226929990878485, "No": 0.3773065469708808}, "ground_truth": 1}, {"key": "11387984", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.09081229455072153, "res": {"No": 0.9091874958617934, "Yes": 0.09081229455072153}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.35571710959134534, "res": {"No": 0.644282670391287, "Yes": 0.35571710959134534}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.6318204331304296, "res": {"Yes": 0.6318204331304296, "No": 0.36817927467275724}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9984180670770559, "res": {"Yes": 0.9984180670770559, "No": 0.0015812810014825007}, "ground_truth": 1}, {"key": "39508312", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999810915907662, "res": {"Yes": 0.9999810915907662, "No": 1.87048071555148e-05}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.01801608155906444, "res": {"No": 0.9819838861285827, "Yes": 0.01801608155906444}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.03943211867390009, "res": {"No": 0.9605676223232754, "Yes": 0.03943211867390009}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999129107124922, "res": {"Yes": 0.9999129107124922, "No": 8.676580200919979e-05}, "ground_truth": 1}, {"key": "35815369", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.20161109693084076, "res": {"No": 0.7983887937241764, "Yes": 0.20161109693084076}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0012536236517971173, "res": {"No": 0.9987421081100807, "Yes": 0.0012536236517971173}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0019458573541232343, "res": {"No": 0.9980539818534192, "Yes": 0.0019458573541232343}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.3610009821557175, "res": {"No": 0.638998897473292, "Yes": 0.3610009821557175}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995509587192274, "res": {"Yes": 0.9995509587192274, "No": 0.0004488826782601867}, "ground_truth": 1}, {"key": "35802823", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.06988064245984701, "res": {"No": 0.9301189897978832, "Yes": 0.06988064245984701}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9843722584880796, "res": {"Yes": 0.9843722584880796, "No": 0.01562739211058636}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0026470459410349654, "res": {"No": 0.9973522255546627, "Yes": 0.0026470459410349654}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.012083884180946025, "res": {"No": 0.987915910190151, "Yes": 0.012083884180946025}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9974433017345093, "res": {"Yes": 0.9974433017345093, "No": 0.0025564985771655453}, "ground_truth": 1}, {"key": "38499968", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.025733284713321484, "res": {"No": 0.9742666547155168, "Yes": 0.025733284713321484}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.4211199158961284, "res": {"No": 0.5788792340121385, "Yes": 0.4211199158961284}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9929860046940313, "res": {"Yes": 0.9929860046940313, "No": 0.007013813621307059}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8685655249785782, "res": {"Yes": 0.8685655249785782, "No": 0.1314342568879435}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999922965856715, "res": {"Yes": 0.9999922965856715, "No": 7.563768599358841e-06}, "ground_truth": 1}, {"key": "36926726", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9900227636816721, "res": {"Yes": 0.9900227636816721, "No": 0.009976988377308274}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.4636244636661059, "res": {"No": 0.5363755018704714, "Yes": 0.4636244636661059}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.923376413127125e-06, "res": {"No": 0.9999903893441826, "Yes": 4.923376413127125e-06}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998087558794887, "res": {"Yes": 0.9998087558794887, "No": 0.00019024668230150483}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999795419732683, "res": {"Yes": 0.9999795419732683, "No": 1.9612508627641135e-05}, "ground_truth": 1}, {"key": "40903712", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.93892341807073, "res": {"Yes": 0.93892341807073, "No": 0.06107497934677966}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.45207640763313417, "res": {"No": 0.5479230399192685, "Yes": 0.45207640763313417}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.087916108849722e-05, "res": {"No": 0.9999690523188893, "Yes": 3.087916108849722e-05}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.08658403792287316, "res": {"No": 0.9134154532431336, "Yes": 0.08658403792287316}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.978259435160723, "res": {"Yes": 0.978259435160723, "No": 0.021740239082379088}, "ground_truth": 1}, {"key": "19614862", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5476850135953472, "res": {"Yes": 0.5476850135953472, "No": 0.4523146106559781}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.5781495365592889, "res": {"Yes": 0.5781495365592889, "No": 0.42184880969727523}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.03403289234858034, "res": {"No": 0.9659670549092552, "Yes": 0.03403289234858034}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9970782808533425, "res": {"Yes": 0.9970782808533425, "No": 0.002921386344086571}, "ground_truth": 1}, {"key": "38861704", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9719608501075447, "res": {"Yes": 0.9719608501075447, "No": 0.02803878636577873}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.023645747262054276, "res": {"No": 0.9763541771228749, "Yes": 0.023645747262054276}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9533809829214254, "res": {"Yes": 0.9533809829214254, "No": 0.0466185149610132}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9812353146100573, "res": {"Yes": 0.9812353146100573, "No": 0.01876437788291781}, "ground_truth": 1}, {"key": "34349607", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.007933156318625895, "res": {"No": 0.9920664902318884, "Yes": 0.007933156318625895}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.34252939504969343, "res": {"No": 0.657470475579521, "Yes": 0.34252939504969343}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.844649947936118e-06, "res": {"No": 0.9999958726752174, "Yes": 3.844649947936118e-06}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.5938260795447882e-05, "res": {"No": 0.9999839524287637, "Yes": 1.5938260795447882e-05}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996227831641674, "res": {"Yes": 0.9996227831641674, "No": 0.00037676835587957655}, "ground_truth": 1}, {"key": "20773800", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9838910545305052, "res": {"Yes": 0.9838910545305052, "No": 0.016108572423944874}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9972847672307881, "res": {"Yes": 0.9972847672307881, "No": 0.002714736184312061}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.13068084840988836, "res": {"No": 0.8693180285102101, "Yes": 0.13068084840988836}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.5458534204464771, "res": {"Yes": 0.5458534204464771, "No": 0.4541453172988939}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997502544316179, "res": {"Yes": 0.9997502544316179, "No": 0.0002491899751475492}, "ground_truth": 1}, {"key": "35545608", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9987381829614347, "res": {"Yes": 0.9987381829614347, "No": 0.0012610870397449798}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.997412242033181, "res": {"Yes": 0.997412242033181, "No": 0.0025869388848602216}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.002424585492817333, "res": {"No": 0.9975730672747961, "Yes": 0.002424585492817333}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.998998535101024, "res": {"Yes": 0.998998535101024, "No": 0.001000751561262878}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999973031140366, "res": {"Yes": 0.9999973031140366, "No": 2.387685670181458e-06}, "ground_truth": 1}, {"key": "37258984", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999889589149532, "res": {"Yes": 0.9999889589149532, "No": 1.0578954023338896e-05}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999936078174301, "res": {"Yes": 0.9999936078174301, "No": 6.06931384284448e-06}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 5.423831898342172e-06, "res": {"No": 0.9999944422379444, "Yes": 5.423831898342172e-06}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8984295574490314, "res": {"Yes": 0.8984295574490314, "No": 0.10157029079844723}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.16096003091571293, "res": {"No": 0.8390381271363169, "Yes": 0.16096003091571293}, "ground_truth": 1}, {"key": "37274562", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8410646072682293, "res": {"Yes": 0.8410646072682293, "No": 0.15893518521928698}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9925672598560695, "res": {"Yes": 0.9925672598560695, "No": 0.007432061518416107}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0002977170557044505, "res": {"No": 0.9997016436671056, "Yes": 0.0002977170557044505}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9902396732120265, "res": {"Yes": 0.9902396732120265, "No": 0.009759991982720944}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996689994827624, "res": {"Yes": 0.9996689994827624, "No": 0.0003307274287262635}, "ground_truth": 1}, {"key": "40828068", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.009998042051584036, "res": {"No": 0.9900018462066879, "Yes": 0.009998042051584036}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7664195069104998, "res": {"Yes": 0.7664195069104998, "No": 0.23357984773665624}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.5677544841052031, "res": {"Yes": 0.5677544841052031, "No": 0.43224459881874466}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8862965037641446, "res": {"Yes": 0.8862965037641446, "No": 0.11370156659504849}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6763567334000509, "res": {"Yes": 0.6763567334000509, "No": 0.323639285417423}, "ground_truth": 1}, {"key": "37807180", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9677368962934337, "res": {"Yes": 0.9677368962934337, "No": 0.03226251335465829}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.002164745015964055, "res": {"No": 0.9978349568941437, "Yes": 0.002164745015964055}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00011398165996636226, "res": {"No": 0.9998828744557322, "Yes": 0.00011398165996636226}, "ground_truth": 1}, {"key": "40748607", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.3859522728064544e-05, "res": {"No": 0.999977753956447, "Yes": 1.3859522728064544e-05}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0001441782754715806, "res": {"No": 0.9998554685256801, "Yes": 0.0001441782754715806}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 9.623293425044152e-06, "res": {"No": 0.9999877668918251, "Yes": 9.623293425044152e-06}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9953415274996019, "res": {"Yes": 0.9953415274996019, "No": 0.004658416944687667}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9904439312080083, "res": {"Yes": 0.9904439312080083, "No": 0.009555930714650673}, "ground_truth": 1}, {"key": "40123819", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9785095640486071, "res": {"Yes": 0.9785095640486071, "No": 0.021490319522738038}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9923799588476055, "res": {"Yes": 0.9923799588476055, "No": 0.007619869769853762}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 2.7106719548200285e-06, "res": {"No": 0.9999963494876631, "Yes": 2.7106719548200285e-06}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9983415487526652, "res": {"Yes": 0.9983415487526652, "No": 0.0016582928655845893}, "ground_truth": 1}, {"key": "38453867", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.004779852455525709, "res": {"No": 0.9952201336940131, "Yes": 0.004779852455525709}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.999995276659155, "res": {"Yes": 0.999995276659155, "No": 4.578578404730417e-06}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.012181218264333072, "res": {"No": 0.98781818840598, "Yes": 0.012181218264333072}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 2.086862116192094e-06, "res": {"No": 0.9999976607241361, "Yes": 2.086862116192094e-06}, "ground_truth": 1}, {"key": "38944856", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.21828950338991246, "res": {"No": 0.7817098289667431, "Yes": 0.21828950338991246}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 7.044285008290515e-07, "res": {"No": 0.99999861435166, "Yes": 7.044285008290515e-07}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0003425088709546126, "res": {"No": 0.9996572059673049, "Yes": 0.0003425088709546126}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.009151162120999512, "res": {"No": 0.9908484853570473, "Yes": 0.009151162120999512}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 6.081658661677737e-05, "res": {"No": 0.9999380608083109, "Yes": 6.081658661677737e-05}, "ground_truth": 1}, {"key": "35778898", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0003050941928555937, "res": {"No": 0.9996942589483242, "Yes": 0.0003050941928555937}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9737208724544043, "res": {"Yes": 0.9737208724544043, "No": 0.026278906390166556}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0015357405059003505, "res": {"No": 0.9984620375782013, "Yes": 0.0015357405059003505}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9975084256369077, "res": {"Yes": 0.9975084256369077, "No": 0.0024900163556324617}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9958140412514769, "res": {"Yes": 0.9958140412514769, "No": 0.004184434540250044}, "ground_truth": 1}, {"key": "32530125", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9111057110317028, "res": {"Yes": 0.9111057110317028, "No": 0.08889274040792255}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.02972163640246927, "res": {"No": 0.970277001204014, "Yes": 0.02972163640246927}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.37672869217848187, "res": {"No": 0.6232709768155332, "Yes": 0.37672869217848187}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998418850414879, "res": {"Yes": 0.9998418850414879, "No": 0.00015793958049530816}, "ground_truth": 1}, {"key": "35010363", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998184059102031, "res": {"Yes": 0.9998184059102031, "No": 0.00018141887026080738}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998941975374753, "res": {"Yes": 0.9998941975374753, "No": 0.00010561733953810892}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.28037303349639364, "res": {"No": 0.719626752998678, "Yes": 0.28037303349639364}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.01812811918648972, "res": {"No": 0.981871813793549, "Yes": 0.01812811918648972}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993391303705925, "res": {"Yes": 0.9993391303705925, "No": 0.0006608520967220754}, "ground_truth": 1}, {"key": "27514800", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995606062817066, "res": {"Yes": 0.9995606062817066, "No": 0.00043932658152160564}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999647611309035, "res": {"Yes": 0.9999647611309035, "No": 3.513843543354634e-05}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.39314308476643195, "res": {"No": 0.6068550583766357, "Yes": 0.39314308476643195}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999124770686805, "res": {"Yes": 0.999124770686805, "No": 0.0008746681505997561}, "ground_truth": 1}, {"key": "25725840", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998460565205136, "res": {"Yes": 0.9998460565205136, "No": 0.0001533668184186047}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.995105857137049, "res": {"Yes": 0.995105857137049, "No": 0.00489348084246652}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00044268778971712095, "res": {"No": 0.9995564396419948, "Yes": 0.00044268778971712095}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.003269559541285495, "res": {"No": 0.9967290202487011, "Yes": 0.003269559541285495}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.11747972658344197, "res": {"No": 0.8825184181213538, "Yes": 0.11747972658344197}, "ground_truth": 1}, {"key": "38327225", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.010410861945740738, "res": {"No": 0.9895808285697644, "Yes": 0.010410861945740738}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0012365117109504233, "res": {"No": 0.9987616110372675, "Yes": 0.0012365117109504233}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.114139028632174e-07, "res": {"No": 0.9999995679800934, "Yes": 2.114139028632174e-07}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.048595200893442894, "res": {"No": 0.951404714183415, "Yes": 0.048595200893442894}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.44001649681997335, "res": {"No": 0.5599821336266602, "Yes": 0.44001649681997335}, "ground_truth": 1}, {"key": "11991724", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 2.2408728720153816e-05, "res": {"No": 0.9999770387506135, "Yes": 2.2408728720153816e-05}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00022105456200889582, "res": {"No": 0.9997784880673918, "Yes": 0.00022105456200889582}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 7.746170234718901e-06, "res": {"No": 0.9999919389784903, "Yes": 7.746170234718901e-06}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9962735115559785, "res": {"Yes": 0.9962735115559785, "No": 0.003726221728944136}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9978528810646754, "res": {"Yes": 0.9978528810646754, "No": 0.002146912747876525}, "ground_truth": 1}, {"key": "32217545", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999441398352371, "res": {"Yes": 0.9999441398352371, "No": 5.556050226901124e-05}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.16172679791524264, "res": {"No": 0.8382729630297276, "Yes": 0.16172679791524264}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.023849105097375e-06, "res": {"No": 0.9999936078174301, "Yes": 3.023849105097375e-06}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.887304387834321, "res": {"Yes": 0.887304387834321, "No": 0.1126945519811183}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00023698090255798343, "res": {"No": 0.9997627567966206, "Yes": 0.00023698090255798343}, "ground_truth": 1}, {"key": "12731847", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.15097885274820283, "res": {"No": 0.8490209388657036, "Yes": 0.15097885274820283}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.129437210631353e-05, "res": {"No": 0.9999840716318578, "Yes": 1.129437210631353e-05}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.003043772131592668, "res": {"No": 0.996951958339948, "Yes": 0.003043772131592668}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00019158518844164177, "res": {"No": 0.9998082791607894, "Yes": 0.00019158518844164177}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.007194593772003186, "res": {"No": 0.9928050206933741, "Yes": 0.007194593772003186}, "ground_truth": 1}, {"key": "36827234", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7974234949675418, "res": {"Yes": 0.7974234949675418, "No": 0.20257619329897028}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0006815445080563928, "res": {"No": 0.9993175836520222, "Yes": 0.0006815445080563928}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.336581933858509e-05, "res": {"No": 0.9999561788061766, "Yes": 4.336581933858509e-05}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.003926338369540674, "res": {"No": 0.99607311645156, "Yes": 0.003926338369540674}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 6.792156326207347e-05, "res": {"No": 0.9999317434295857, "Yes": 6.792156326207347e-05}, "ground_truth": 1}, {"key": "29111539", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 2.3612791029082538e-05, "res": {"No": 0.9999757275415809, "Yes": 2.3612791029082538e-05}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00476778091171029, "res": {"No": 0.9952320534174128, "Yes": 0.00476778091171029}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0024718898486181286, "res": {"No": 0.9975281167473322, "Yes": 0.0024718898486181286}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00025958768827763, "res": {"No": 0.9997402475715051, "Yes": 0.00025958768827763}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9989193049719284, "res": {"Yes": 0.9989193049719284, "No": 0.0010805944203949906}, "ground_truth": 1}, {"key": "37763052", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.016765534796336752, "res": {"No": 0.98323418815963, "Yes": 0.016765534796336752}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.999406870770727, "res": {"Yes": 0.999406870770727, "No": 0.0005929599495197039}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.8792024628955334e-05, "res": {"No": 0.9999771579518836, "Yes": 1.8792024628955334e-05}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999653571300781, "res": {"Yes": 0.9999653571300781, "No": 3.4300727297789356e-05}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 1.9891443232817093e-06}, "ground_truth": 1}, {"key": "30682335", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999888238005837, "res": {"Yes": 0.999888238005837, "No": 0.00011144648917215477}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993336543069635, "res": {"Yes": 0.9993336543069635, "No": 0.0006652582146285502}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9517156840537194, "res": {"Yes": 0.9517156840537194, "No": 0.04828414659736354}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 7.59191337312229e-07}, "ground_truth": 1}, {"key": "12261276", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 2.1005530158838478e-07}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999876476902904, "res": {"Yes": 0.9999876476902904, "No": 1.211394850840788e-05}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999726283256111, "res": {"Yes": 0.9999726283256111, "No": 2.681242924930712e-05}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999783499623655, "res": {"Yes": 0.9999783499623655, "No": 2.081359872552964e-05}, "ground_truth": 1}, {"key": "36912979", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995413149281765, "res": {"Yes": 0.9995413149281765, "No": 0.0004581572922268143}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999968263007362, "res": {"Yes": 0.9999968263007362, "No": 2.807427428000166e-06}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00016015859738850364, "res": {"No": 0.9998396205321621, "Yes": 0.00016015859738850364}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9965712953783056, "res": {"Yes": 0.9965712953783056, "No": 0.0034282008121109104}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996796051573934, "res": {"Yes": 0.9996796051573934, "No": 0.00032034981095487155}, "ground_truth": 1}, {"key": "30205259", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988441368250383, "res": {"Yes": 0.9988441368250383, "No": 0.0011556168596014926}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.27584452147029487, "res": {"No": 0.7241549573561654, "Yes": 0.27584452147029487}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0010158566828121884, "res": {"No": 0.9989840216558329, "Yes": 0.0010158566828121884}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9857849003320087, "res": {"Yes": 0.9857849003320087, "No": 0.014214908084389626}, "ground_truth": 1}, {"key": "39458032", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0011401049037227024, "res": {"No": 0.9988588865656557, "Yes": 0.0011401049037227024}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.017146983672384413, "res": {"No": 0.9828529923683663, "Yes": 0.017146983672384413}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.6857053448410105, "res": {"Yes": 0.6857053448410105, "No": 0.31429347368439786}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 2.344619334375058e-06, "res": {"No": 0.9999974223173222, "Yes": 2.344619334375058e-06}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, " Yes": 3.590532969522966e-07}, "ground_truth": 1}, {"key": "35116452", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999697675220106, "res": {"Yes": 0.9999697675220106, "No": 2.8671140459920588e-05}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994223508035747, "res": {"Yes": 0.9994223508035747, "No": 0.000577097920278095}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0013697412850560138, "res": {"No": 0.9986302239008594, "Yes": 0.0013697412850560138}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0002297852226230554, "res": {"No": 0.9997699073453761, "Yes": 0.0002297852226230554}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.03826563285936379, "res": {"No": 0.9617340883142322, "Yes": 0.03826563285936379}, "ground_truth": 1}, {"key": "40107476", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8443596411844538, "res": {"Yes": 0.8443596411844538, "No": 0.1556400670599651}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 4.267249856202083e-06, "res": {"No": 0.999995276659155, "Yes": 4.267249856202083e-06}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0024388686871612253, "res": {"No": 0.9975569463250171, "Yes": 0.0024388686871612253}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 3.98420767239998e-05, "res": {"No": 0.9999598739650709, "Yes": 3.98420767239998e-05}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.005417540222669312, "res": {"No": 0.9945823510805404, "Yes": 0.005417540222669312}, "ground_truth": 1}, {"key": "39501049", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.04070352422449, "res": {"No": 0.959296342347868, "Yes": 0.04070352422449}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 6.767985399181315e-05, "res": {"No": 0.999932220207154, "Yes": 6.767985399181315e-05}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.168785102175538e-07, "res": {"No": 0.9999993295729247, "Yes": 4.168785102175538e-07}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.0789728868923044e-06, "res": {"No": 0.99999861435166, "Yes": 1.0789728868923044e-06}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4421687422339075, "res": {"No": 0.5578311003303364, "Yes": 0.4421687422339075}, "ground_truth": 1}, {"key": "39642178", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.006456379933960612, "res": {"No": 0.993543602681617, "Yes": 0.006456379933960612}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0007478643101411681, "res": {"No": 0.9992518815802326, "Yes": 0.0007478643101411681}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.4634027444974713e-06, "res": {"No": 0.9999944422379444, "Yes": 3.4634027444974713e-06}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999928926002577, "res": {"Yes": 0.9999928926002577, "No": 6.708628662991022e-06}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, " Yes": 5.142151907797211e-07}, "ground_truth": 1}, {"key": "38024796", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 6.459659781197414e-07}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999983759447187, "res": {"Yes": 0.9999983759447187, "No": 1.1392083119624107e-06}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.05839657722654742, "res": {"No": 0.9416033681431876, "Yes": 0.05839657722654742}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.2824658275887561, "res": {"No": 0.7175337314353228, "Yes": 0.2824658275887561}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.14870502993930299, "res": {"No": 0.8512941056976324, "Yes": 0.14870502993930299}, "ground_truth": 1}, {"key": "36652079", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6276917857572826, "res": {"Yes": 0.6276917857572826, "No": 0.37230815275318496}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.005889209505017585, "res": {"No": 0.9941106605509903, "Yes": 0.005889209505017585}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.4677419144629022, "res": {"No": 0.532257885453162, "Yes": 0.4677419144629022}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.3381623748125523, "res": {"No": 0.6618372825568615, "Yes": 0.3381623748125523}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.95374193548983, "res": {"Yes": 0.95374193548983, "No": 0.04625771583838725}, "ground_truth": 1}, {"key": "32193402", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.972061538803066, "res": {"Yes": 0.972061538803066, "No": 0.027938014239353447}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984532484551071, "res": {"Yes": 0.9984532484551071, "No": 0.0015466391384290044}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.02264438863795314, "res": {"No": 0.9773553447343128, "Yes": 0.02264438863795314}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9971524714222928, "res": {"Yes": 0.9971524714222928, "No": 0.0028471388535296783}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999708403221517, "res": {"Yes": 0.9999708403221517, "No": 2.880958251350733e-05}, "ground_truth": 1}, {"key": "32589706", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998704861276457, "res": {"Yes": 0.9998704861276457, "No": 0.00012924483586458218}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999988527586581, "res": {"Yes": 0.9999988527586581, "No": 7.78821466709435e-07}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 9.50243002463643e-06, "res": {"No": 0.9999901509395023, "Yes": 9.50243002463643e-06}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9599454548490731, "res": {"Yes": 0.9599454548490731, "No": 0.04005418566269265}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999645227323332, "res": {"Yes": 0.9999645227323332, "No": 3.526854738968841e-05}, "ground_truth": 1}, {"key": "38590589", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997887336898705, "res": {"Yes": 0.9997887336898705, "No": 0.0002110855619102865}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7984895727177487, "res": {"Yes": 0.7984895727177487, "No": 0.20151045763683373}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00016180186934119147, "res": {"No": 0.9998311584553382, "Yes": 0.00016180186934119147}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.04807814360718834, "res": {"No": 0.951915915639163, "Yes": 0.04807814360718834}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.029620707042058957, "res": {"No": 0.9703780249122896, "Yes": 0.029620707042058957}, "ground_truth": 1}, {"key": "37045414", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0008538500201773516, "res": {"No": 0.9991448876471261, "Yes": 0.0008538500201773516}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 3.023854871601124e-05, "res": {"No": 0.9999679795226665, "Yes": 3.023854871601124e-05}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 4.791082918886287e-05, "res": {"No": 0.9999518876724351, "Yes": 4.791082918886287e-05}, "ground_truth": 1}, {"key": "33310095", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.01202178329777114, "res": {"No": 0.9879772191900963, "Yes": 0.01202178329777114}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 9.17838685165249e-05, "res": {"No": 0.9999081429891136, "Yes": 9.17838685165249e-05}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.1308908512038028, "res": {"No": 0.8691088870611413, "Yes": 0.1308908512038028}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7648646415205574, "res": {"Yes": 0.7648646415205574, "No": 0.2351350850475208}, "ground_truth": 1}, {"key": "37934604", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4688597808364916, "res": {"No": 0.5311398082620413, "Yes": 0.4688597808364916}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00014864450131822575, "res": {"No": 0.9998512970173847, "Yes": 0.00014864450131822575}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0014204787731583802, "res": {"No": 0.9985776827533088, "Yes": 0.0014204787731583802}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.018597241792220016, "res": {"No": 0.9814022241751845, "Yes": 0.018597241792220016}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.11916318770812874, "res": {"No": 0.88083445190945, "Yes": 0.11916318770812874}, "ground_truth": 1}, {"key": "39012181", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.005573125228916841, "res": {"No": 0.9944258907200425, "Yes": 0.005573125228916841}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0005432439910514, "res": {"No": 0.9994565284342001, "Yes": 0.0005432439910514}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0002243545376462988, "res": {"No": 0.9997753894687232, "Yes": 0.0002243545376462988}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.3085446402078172e-06}, "ground_truth": 1}, {"key": "40221674", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.17779128017326457, "res": {"No": 0.8222083901978037, "Yes": 0.17779128017326457}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.002020482368074063, "res": {"No": 0.9979793085514317, "Yes": 0.002020482368074063}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.725736703941932e-05, "res": {"No": 0.9999522452652937, "Yes": 4.725736703941932e-05}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9294064057547474, "res": {"Yes": 0.9294064057547474, "No": 0.07059335222749598}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9785220088123788, "res": {"Yes": 0.9785220088123788, "No": 0.021477805056808096}, "ground_truth": 1}, {"key": "36884862", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9688694545439898, "res": {"Yes": 0.9688694545439898, "No": 0.031128813799276466}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9665310022737877, "res": {"Yes": 0.9665310022737877, "No": 0.03346859642344101}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.2337651088401836e-06, "res": {"No": 0.9999977799274644, "Yes": 1.2337651088401836e-06}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0051453339712254275, "res": {"No": 0.9948537748231037, "Yes": 0.0051453339712254275}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.960247428219761, "res": {"Yes": 0.960247428219761, "No": 0.03975194532840114}, "ground_truth": 1}, {"key": "39054429", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9343058703965315, "res": {"Yes": 0.9343058703965315, "No": 0.06569347325860615}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9966320307751387, "res": {"Yes": 0.9966320307751387, "No": 0.0033666166511750655}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.3997476376070116e-06, "res": {"No": 0.999985978860297, "Yes": 6.3997476376070116e-06}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998176908203386, "res": {"Yes": 0.9998176908203386, "No": 0.00018175253389449286}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 5.117027228322108e-07}, "ground_truth": 1}, {"key": "36753964", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9772650539769893, "res": {"Yes": 0.9772650539769893, "No": 0.022734122257361065}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.957195906014503, "res": {"Yes": 0.957195906014503, "No": 0.042803200549341}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.369262761864548e-05, "res": {"No": 0.9999821644040562, "Yes": 1.369262761864548e-05}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.023142331639455057, "res": {"No": 0.9768560495965599, "Yes": 0.023142331639455057}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9963562171472932, "res": {"Yes": 0.9963562171472932, "No": 0.0036421922942149153}, "ground_truth": 1}, {"key": "37612459", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9890438773247587, "res": {"Yes": 0.9890438773247587, "No": 0.010954079883657415}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.007148258631362889, "res": {"No": 0.9928509638087073, "Yes": 0.007148258631362889}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00031261192278414404, "res": {"No": 0.999684844801836, "Yes": 0.00031261192278414404}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0003229991068227776, "res": {"No": 0.9996761493709394, "Yes": 0.0003229991068227776}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0005607490941449702, "res": {"No": 0.9994389033736201, "Yes": 0.0005607490941449702}, "ground_truth": 1}, {"key": "36805789", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.002034966341556578, "res": {"No": 0.9979642299963757, "Yes": 0.002034966341556578}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0012947539524379213, "res": {"No": 0.9987041783029356, "Yes": 0.0012947539524379213}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.007539438268021163, "res": {"No": 0.9924602754076408, "Yes": 0.007539438268021163}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9961281037950864, "res": {"Yes": 0.9961281037950864, "No": 0.003871506775663243}, "ground_truth": 1}, {"key": "12757394", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8764466355897458, "res": {"Yes": 0.8764466355897458, "No": 0.12355016636605783}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.6232331703447614, "res": {"Yes": 0.6232331703447614, "No": 0.37676617854826966}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 2.267606715512369e-05, "res": {"No": 0.9999697675220106, "Yes": 2.267606715512369e-05}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9855221280636405, "res": {"Yes": 0.9855221280636405, "No": 0.014475824454674963}, "ground_truth": 1}, {"key": "32192542", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.06663335506539159, "res": {"No": 0.9333616338168755, "Yes": 0.06663335506539159}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9518518700352254, "res": {"Yes": 0.9518518700352254, "No": 0.048140599184362844}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.496564280779043e-05, "res": {"No": 0.9999337697473201, "Yes": 6.496564280779043e-05}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 6.908268710398421e-06, "res": {"No": 0.9999925349918634, "Yes": 6.908268710398421e-06}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9979989011733367, "res": {"Yes": 0.9979989011733367, "No": 0.0020002372109105254}, "ground_truth": 1}, {"key": "34856060", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999652379302147, "res": {"Yes": 0.9999652379302147, "No": 3.385252390290093e-05}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.21216372810501608, "res": {"No": 0.7878359626660458, "Yes": 0.21216372810501608}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.02149408925537821, "res": {"No": 0.9785021411032095, "Yes": 0.02149408925537821}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 4.042032089496037e-06, "res": {"No": 0.9999950382530095, "Yes": 4.042032089496037e-06}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 4.185727253087781e-05, "res": {"No": 0.9999546292272846, "Yes": 4.185727253087781e-05}, "ground_truth": 1}, {"key": "36083416", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.004534558291719748, "res": {"No": 0.9954624792945869, "Yes": 0.004534558291719748}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0019921018332837307, "res": {"No": 0.998005076510243, "Yes": 0.0019921018332837307}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 8.817536811695065e-06, "res": {"No": 0.9999897933310884, "Yes": 8.817536811695065e-06}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 4.7547421384581326e-05, "res": {"No": 0.9999522452652937, "Yes": 4.7547421384581326e-05}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999987335551019, "res": {"Yes": 0.9999987335551019, "No": 1.042876288706642e-06}, "ground_truth": 1}, {"key": "33839050", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9947100827518243, "res": {"Yes": 0.9947100827518243, "No": 0.005289656336325604}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.21397570466672516, "res": {"No": 0.7860237977308582, "Yes": 0.21397570466672516}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999931310055916, "res": {"Yes": 0.9999931310055916, "No": 6.701796052189856e-06}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.319789900925198e-06}, "ground_truth": 1}, {"key": "18464690", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998601168145652, "res": {"Yes": 0.9998601168145652, "No": 0.00013962699673204893}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.999525591067521, "res": {"Yes": 0.999525591067521, "No": 0.00047421033024321236}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 9.624044071206111e-06, "res": {"No": 0.9999860980626328, "Yes": 9.624044071206111e-06}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.7723129001489013, "res": {"Yes": 0.7723129001489013, "No": 0.22768645359923267}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4946087168551908, "res": {"No": 0.5053905258745742, "Yes": 0.4946087168551908}, "ground_truth": 1}, {"key": "39212665", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0009550150103147462, "res": {"No": 0.9990444514275743, "Yes": 0.0009550150103147462}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.98329584772562, "res": {"Yes": 0.98329584772562, "No": 0.016702626441153515}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.012478381649129218, "res": {"No": 0.9875215318890164, "Yes": 0.012478381649129218}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6078002178960014, "res": {"Yes": 0.6078002178960014, "No": 0.39219931961983145}, "ground_truth": 1}, {"key": "40094011", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5719458671102116, "res": {"Yes": 0.5719458671102116, "No": 0.4280540313055516}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.005962099469205702, "res": {"No": 0.9940372629012448, "Yes": 0.005962099469205702}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 8.27303528245277e-05, "res": {"No": 0.9999167249015635, "Yes": 8.27303528245277e-05}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.16685848850690563, "res": {"No": 0.83313958652115, "Yes": 0.16685848850690563}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9340442303868283, "res": {"Yes": 0.9340442303868283, "No": 0.06595501237851828}, "ground_truth": 1}, {"key": "36036272", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.29216899328352086, "res": {"No": 0.7078306562397664, "Yes": 0.29216899328352086}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0007340055265635287, "res": {"No": 0.9992656880390844, "Yes": 0.0007340055265635287}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00025146091199659034, "res": {"No": 0.999748228499765, "Yes": 0.00025146091199659034}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9974153186557279, "res": {"Yes": 0.9974153186557279, "No": 0.002584481167665294}, "ground_truth": 1}, {"key": "30681904", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00037514554023300586, "res": {"No": 0.9996248088718013, "Yes": 0.00037514554023300586}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0014667151066647488, "res": {"No": 0.9985329965031682, "Yes": 0.0014667151066647488}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.999996945503965, "res": {"Yes": 0.999996945503965, "No": 2.835208722607289e-06}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 1.7875279841970265e-07}, "ground_truth": 1}, {"key": "27834240", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999957534720165, "res": {"Yes": 0.9999957534720165, "No": 4.058963144883716e-06}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999944422379444, "res": {"Yes": 0.9999944422379444, "No": 5.276344655981049e-06}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.580826142540773e-06, "res": {"No": 0.9999964686909351, "Yes": 2.580826142540773e-06}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0016390794593683564, "res": {"No": 0.9983606794562184, "Yes": 0.0016390794593683564}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999355576904948, "res": {"Yes": 0.9999355576904948, "No": 6.375365769269291e-05}, "ground_truth": 1}, {"key": "35025075", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9980409351774322, "res": {"Yes": 0.9980409351774322, "No": 0.0019585444679699714}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.35797379270345037, "res": {"No": 0.6420250483062072, "Yes": 0.35797379270345037}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9157089911819818, "res": {"Yes": 0.9157089911819818, "No": 0.08429050953229285}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00113236886478036, "res": {"No": 0.9988675710821123, "Yes": 0.00113236886478036}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999002763027385, "res": {"Yes": 0.9999002763027385, "No": 9.94409059782823e-05}, "ground_truth": 1}, {"key": "33316985", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9788827301193117, "res": {"Yes": 0.9788827301193117, "No": 0.021116982593011365}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0034073786760560653, "res": {"No": 0.9965923751769428, "Yes": 0.0034073786760560653}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.019670673033897e-05, "res": {"No": 0.9999796611748367, "Yes": 2.019670673033897e-05}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9485153711428531, "res": {"Yes": 0.9485153711428531, "No": 0.051483562346415886}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999139834496357, "res": {"Yes": 0.9999139834496357, "No": 8.587944907759039e-05}, "ground_truth": 1}, {"key": "17037056", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996338649837903, "res": {"Yes": 0.9996338649837903, "No": 0.0003657233809756266}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.006148961950172159, "res": {"No": 0.9938509469859802, "Yes": 0.006148961950172159}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.320760656542322e-06, "res": {"No": 0.9999893165220688, "Yes": 6.320760656542322e-06}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8938751918377318, "res": {"Yes": 0.8938751918377318, "No": 0.10612434567247733}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9948652197862465, "res": {"Yes": 0.9948652197862465, "No": 0.005134012303816133}, "ground_truth": 1}, {"key": "34050457", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9114321822410328, "res": {"Yes": 0.9114321822410328, "No": 0.0885674208048127}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0003447245036778742, "res": {"No": 0.9996550610051392, "Yes": 0.0003447245036778742}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.520222870616708e-06, "res": {"No": 0.9999931310055916, "Yes": 6.520222870616708e-06}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.18334556013537853, "res": {"No": 0.8166541751199053, "Yes": 0.18334556013537853}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9767660706458205, "res": {"Yes": 0.9767660706458205, "No": 0.023231701246294048}, "ground_truth": 1}, {"key": "34713745", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9903616015020955, "res": {"Yes": 0.9903616015020955, "No": 0.00963776060241663}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.921062540534723, "res": {"Yes": 0.921062540534723, "No": 0.07893664581178493}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 8.795230254132934e-06, "res": {"No": 0.9999838332276837, "Yes": 8.795230254132934e-06}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0008585368112317433, "res": {"No": 0.9991410763862468, "Yes": 0.0008585368112317433}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.576045844677203, "res": {"Yes": 0.576045844677203, "No": 0.42395313522025224}, "ground_truth": 1}, {"key": "40856210", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.021194548004012503, "res": {"No": 0.9788048366676017, "Yes": 0.021194548004012503}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8641853739573054, "res": {"Yes": 0.8641853739573054, "No": 0.13581282879777343}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998023201312406, "res": {"Yes": 0.9998023201312406, "No": 0.00019753535045386676}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997489435499461, "res": {"Yes": 0.9997489435499461, "No": 0.00025080394993184555}, "ground_truth": 1}, {"key": "40848302", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9620833015668254, "res": {"Yes": 0.9620833015668254, "No": 0.037916337165409215}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 3.6086641090310005e-07}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9936789514159561, "res": {"Yes": 0.9936789514159561, "No": 0.006319359000112298}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 2.380139622689671e-07}, "ground_truth": 1}, {"key": "40636168", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999951574563252, "res": {"Yes": 0.9999951574563252, "No": 4.112941878439521e-06}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.784557463649217e-05, "res": {"No": 0.9999815683978641, "Yes": 1.784557463649217e-05}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.013136745177445215, "res": {"No": 0.9868631743203239, "Yes": 0.013136745177445215}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8737776593733422, "res": {"Yes": 0.8737776593733422, "No": 0.12622099244980495}, "ground_truth": 1}, {"key": "34423311", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9384627131555333, "res": {"Yes": 0.9384627131555333, "No": 0.061536240580124725}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.6464371120368463, "res": {"Yes": 0.6464371120368463, "No": 0.3535608756947411}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.322809547783269e-05, "res": {"No": 0.9999764427474764, "Yes": 2.322809547783269e-05}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.6939831904654579, "res": {"Yes": 0.6939831904654579, "No": 0.3060162420021402}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.280111455404415, "res": {"No": 0.7198883704743375, "Yes": 0.280111455404415}, "ground_truth": 1}, {"key": "34833945", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0021544366605881723, "res": {"No": 0.9978454020855745, "Yes": 0.0021544366605881723}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.14855834533867762, "res": {"No": 0.8514411709431102, "Yes": 0.14855834533867762}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.822695654080109e-07, "res": {"No": 0.9999987335551019, "Yes": 6.822695654080109e-07}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9941683886425442, "res": {"Yes": 0.9941683886425442, "No": 0.005828955232978151}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996583975793978, "res": {"Yes": 0.9996583975793978, "No": 0.00033980997284358965}, "ground_truth": 1}, {"key": "21272328", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995801399459115, "res": {"Yes": 0.9995801399459115, "No": 0.0004194692652238679}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.6715991160263911, "res": {"Yes": 0.6715991160263911, "No": 0.3284005915815617}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0006615043489860241, "res": {"No": 0.9993380581802147, "Yes": 0.0006615043489860241}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.01420736907554976, "res": {"No": 0.9857923134623325, "Yes": 0.01420736907554976}, "ground_truth": 1}, {"key": "38648957", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9446187302058011, "res": {"Yes": 0.9446187302058011, "No": 0.055380407666934084}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.069012405547623, "res": {"No": 0.930987014227985, "Yes": 0.069012405547623}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0007914027137255018, "res": {"No": 0.9992079549334182, "Yes": 0.0007914027137255018}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.999736553208202, "res": {"Yes": 0.999736553208202, "No": 0.0002628042761465726}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.30362921788450353, "res": {"No": 0.6963702581488805, "Yes": 0.30362921788450353}, "ground_truth": 1}, {"key": "24942981", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.10953665904004412, "res": {"No": 0.8904625074020757, "Yes": 0.10953665904004412}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9982143174316426, "res": {"Yes": 0.9982143174316426, "No": 0.0017849151498114501}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.05576099881161107, "res": {"No": 0.9442363749386546, "Yes": 0.05576099881161107}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994158020601054, "res": {"Yes": 0.9994158020601054, "No": 0.0005829541614529636}, "ground_truth": 1}, {"key": "35882366", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9917457043311522, "res": {"Yes": 0.9917457043311522, "No": 0.008251042689628724}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.999748228499765, "res": {"Yes": 0.999748228499765, "No": 0.00025037869655835266}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.580176181534693e-05, "res": {"No": 0.999954033236504, "Yes": 4.580176181534693e-05}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.026774174342639498, "res": {"No": 0.9732253931364976, "Yes": 0.026774174342639498}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999870516788303, "res": {"Yes": 0.9999870516788303, "No": 1.2624767485027135e-05}, "ground_truth": 1}, {"key": "40559523", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8249464696708907, "res": {"Yes": 0.8249464696708907, "No": 0.17505327899404524}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9932098691279512, "res": {"Yes": 0.9932098691279512, "No": 0.006789832543089275}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.05196031629082185, "res": {"No": 0.9480392041439184, "Yes": 0.05196031629082185}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998433152563369, "res": {"Yes": 0.9998433152563369, "No": 0.00015647066650890332}, "ground_truth": 1}, {"key": "24632722", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991654668566406, "res": {"Yes": 0.9991654668566406, "No": 0.0008342403564033694}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9210813488238327, "res": {"Yes": 0.9210813488238327, "No": 0.07891807420406076}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.02357861079864685, "res": {"No": 0.9764141808125745, "Yes": 0.02357861079864685}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.2544647651306655, "res": {"No": 0.7455350503404454, "Yes": 0.2544647651306655}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9774319948780408, "res": {"Yes": 0.9774319948780408, "No": 0.02256751039892505}, "ground_truth": 1}, {"key": "36002759", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8676306008171655, "res": {"Yes": 0.8676306008171655, "No": 0.13236847077217073}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985844566279951, "res": {"Yes": 0.9985844566279951, "No": 0.0014148397573340962}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00016494078949694149, "res": {"No": 0.9998349723485612, "Yes": 0.00016494078949694149}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00174644846803768, "res": {"No": 0.9982534001838542, "Yes": 0.00174644846803768}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4044448309671575, "res": {"No": 0.5955548422314058, "Yes": 0.4044448309671575}, "ground_truth": 1}, {"key": "29508534", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.09980352256950428, "res": {"No": 0.9001963930168253, "Yes": 0.09980352256950428}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00624918889784691, "res": {"No": 0.9937507605306765, "Yes": 0.00624918889784691}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 8.886821641600662e-05, "res": {"No": 0.999910407653634, "Yes": 8.886821641600662e-05}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999621387467553, "res": {"Yes": 0.9999621387467553, "No": 3.740420225860258e-05}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, " Yes": 3.0042190508236963e-07}, "ground_truth": 1}, {"key": "15631612", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, " Yes": 1.9642974526978552e-07}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996022990639911, "res": {"Yes": 0.9996022990639911, "No": 0.00039749547801400185}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 8.163087479266469e-05, "res": {"No": 0.9999160097413793, "Yes": 8.163087479266469e-05}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9706720910910392, "res": {"Yes": 0.9706720910910392, "No": 0.029327527467691815}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9925424737759367, "res": {"Yes": 0.9925424737759367, "No": 0.0074570252824083735}, "ground_truth": 1}, {"key": "40731892", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7944862656014772, "res": {"Yes": 0.7944862656014772, "No": 0.20551264789612542}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9983540296973868, "res": {"Yes": 0.9983540296973868, "No": 0.0016455806143299521}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.002292308249183374, "res": {"No": 0.9977076143384472, "Yes": 0.002292308249183374}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 5.475809167671704e-06, "res": {"No": 0.9999936078174301, "Yes": 5.475809167671704e-06}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999553222594762, "res": {"Yes": 0.999553222594762, "No": 0.0004466045636314164}, "ground_truth": 1}, {"key": "35971910", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00016310278060751682, "res": {"No": 0.9998356874507859, "Yes": 0.00016310278060751682}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.40999198838462786, "res": {"No": 0.59000796628238, "Yes": 0.40999198838462786}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.2221816078513597e-05, "res": {"No": 0.9999843100330889, "Yes": 1.2221816078513597e-05}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0011567469116865584, "res": {"No": 0.9988431842278392, "Yes": 0.0011567469116865584}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6623531738906882, "res": {"Yes": 0.6623531738906882, "No": 0.3376458546833244}, "ground_truth": 1}, {"key": "34428424", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.755566613308502, "res": {"Yes": 0.755566613308502, "No": 0.2444325444383652}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.0462553590617817e-05, "res": {"No": 0.999983356420506, "Yes": 1.0462553590617817e-05}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00011450867198244478, "res": {"No": 0.9998852582493383, "Yes": 0.00011450867198244478}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0019120301416803783, "res": {"No": 0.998087354841389, "Yes": 0.0019120301416803783}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.015400119651728147, "res": {"No": 0.984599745636536, "Yes": 0.015400119651728147}, "ground_truth": 1}, {"key": "36971005", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9741285076535509, "res": {"Yes": 0.9741285076535509, "No": 0.025871267215662852}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0036199332229988512, "res": {"No": 0.9963785878871237, "Yes": 0.0036199332229988512}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9997290453948312, "res": {"Yes": 0.9997290453948312, "No": 0.0002693168474358788}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9055512180303995, "res": {"Yes": 0.9055512180303995, "No": 0.09444729735518793}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996564909727406, "res": {"Yes": 0.9996564909727406, "No": 0.00034316629610333125}, "ground_truth": 1}, {"key": "34649067", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9823519830227944, "res": {"Yes": 0.9823519830227944, "No": 0.01764732614994511}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999815683978641, "res": {"Yes": 0.9999815683978641, "No": 1.6932884471294486e-05}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.016672968250237e-06, "res": {"No": 0.9999955150656573, "Yes": 3.016672968250237e-06}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993631792064882, "res": {"Yes": 0.9993631792064882, "No": 0.0006364020756223935}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999995276659155, "res": {"Yes": 0.999995276659155, "No": 2.780185238298777e-06}, "ground_truth": 1}, {"key": "37355154", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999977753956447, "res": {"Yes": 0.999977753956447, "No": 2.097498543519586e-05}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9819007892583049, "res": {"Yes": 0.9819007892583049, "No": 0.01809745424590364}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.021750730042704e-06, "res": {"No": 0.9999983759447187, "Yes": 1.021750730042704e-06}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.3294648854217406, "res": {"No": 0.670534609595802, "Yes": 0.3294648854217406}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9882576172679856, "res": {"Yes": 0.9882576172679856, "No": 0.011742198692057025}, "ground_truth": 1}, {"key": "38674697", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9987789714627155, "res": {"Yes": 0.9987789714627155, "No": 0.0012207858356696984}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.07854264133144026, "res": {"No": 0.9214572359025952, "Yes": 0.07854264133144026}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.9031217381381794e-06, "res": {"No": 0.9999975415208221, "Yes": 1.9031217381381794e-06}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 3.822273738201841e-05, "res": {"No": 0.9999609467545978, "Yes": 3.822273738201841e-05}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9681447730039476, "res": {"Yes": 0.9681447730039476, "No": 0.03185362782489748}, "ground_truth": 1}, {"key": "40525767", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8876514893264545, "res": {"Yes": 0.8876514893264545, "No": 0.11234751488489729}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0005831293071886368, "res": {"No": 0.9994167551134628, "Yes": 0.0005831293071886368}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0013987497179255, "res": {"No": 0.9986003855751407, "Yes": 0.0013987497179255}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.15128515187244118, "res": {"No": 0.8487141920855813, "Yes": 0.15128515187244118}, "ground_truth": 1}, {"key": "27165110", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.13736323656842156, "res": {"No": 0.862636182316041, "Yes": 0.13736323656842156}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00010072545597171127, "res": {"No": 0.9998990843823236, "Yes": 0.00010072545597171127}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.010212286752930743, "res": {"No": 0.9897871450206924, "Yes": 0.010212286752930743}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 6.025951938395187e-05, "res": {"No": 0.9999392527721875, "Yes": 6.025951938395187e-05}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.004215496082122626, "res": {"No": 0.9957844898128952, "Yes": 0.004215496082122626}, "ground_truth": 1}, {"key": "35497491", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.01814427853860719, "res": {"No": 0.9818557328286701, "Yes": 0.01814427853860719}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.05421886870671022, "res": {"No": 0.9457809714259204, "Yes": 0.05421886870671022}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9805063265454047, "res": {"Yes": 0.9805063265454047, "No": 0.019493652094994943}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.999265807051635, "res": {"Yes": 0.999265807051635, "No": 0.0007338323216982376}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 7.773812738430053e-08}, "ground_truth": 1}, {"key": "40690716", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999489077252547, "res": {"Yes": 0.9999489077252547, "No": 5.087606402112863e-05}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996935439372551, "res": {"Yes": 0.9996935439372551, "No": 0.0003063087431904373}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0001487706053158817, "res": {"No": 0.9998497475990228, "Yes": 0.0001487706053158817}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.4109671478167515, "res": {"No": 0.5890314506893467, "Yes": 0.4109671478167515}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9978129959858119, "res": {"Yes": 0.9978129959858119, "No": 0.0021866152034036965}, "ground_truth": 1}, {"key": "34835193", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.976694990058236, "res": {"Yes": 0.976694990058236, "No": 0.02330381262086321}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997551406029567, "res": {"Yes": 0.9997551406029567, "No": 0.00024449419296152707}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.1668778952776008, "res": {"No": 0.8331220324549948, "Yes": 0.1668778952776008}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.011863763602029372, "res": {"No": 0.9881352617495912, "Yes": 0.011863763602029372}, "ground_truth": 1}, {"key": "39471712", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.010455486650817367, "res": {"No": 0.9895439317468621, "Yes": 0.010455486650817367}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.002020151642181062, "res": {"No": 0.9979796655286942, "Yes": 0.002020151642181062}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.9976900897579593e-06, "res": {"No": 0.9999975415208221, "Yes": 1.9976900897579593e-06}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 4.627928986841182e-05, "res": {"No": 0.9999520068687072, "Yes": 4.627928986841182e-05}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.012293823465541519, "res": {"No": 0.9877055904650396, "Yes": 0.012293823465541519}, "ground_truth": 1}, {"key": "39115192", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0015083740445510942, "res": {"No": 0.9984904473225734, "Yes": 0.0015083740445510942}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 4.370561388176159e-05, "res": {"No": 0.9999559404106522, "Yes": 4.370561388176159e-05}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.8570226743598225e-06, "res": {"No": 0.9999930118027176, "Yes": 3.8570226743598225e-06}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.014682123700680977, "res": {"No": 0.9853175864354453, "Yes": 0.014682123700680977}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999973031140366, "res": {"Yes": 0.9999973031140366, "No": 2.494039182809628e-06}, "ground_truth": 1}, {"key": "23520673", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997598965894386, "res": {"Yes": 0.9997598965894386, "No": 0.00023994111953325718}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.10558529175856955, "res": {"No": 0.8944143646992692, "Yes": 0.10558529175856955}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.008447129495502657, "res": {"No": 0.991552743275898, "Yes": 0.008447129495502657}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9894837099357442, "res": {"Yes": 0.9894837099357442, "No": 0.010515926095015808}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 2.0416709341660465e-06}, "ground_truth": 1}, {"key": "35764233", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999480733442354, "res": {"Yes": 0.9999480733442354, "No": 5.16067025258716e-05}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.999948788531352, "res": {"Yes": 0.999948788531352, "No": 5.09675705021233e-05}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.0367320071793613e-05, "res": {"No": 0.9999889589149532, "Yes": 1.0367320071793613e-05}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.3433635192776087e-06, "res": {"No": 0.9999984951481323, "Yes": 1.3433635192776087e-06}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.251461646519479, "res": {"No": 0.7485382456762323, "Yes": 0.251461646519479}, "ground_truth": 1}, {"key": "35228910", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.959777521322992, "res": {"Yes": 0.959777521322992, "No": 0.04022216770073871}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992306904704324, "res": {"Yes": 0.9992306904704324, "No": 0.0007690432101386305}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.007570838132697767, "res": {"No": 0.9924279898105881, "Yes": 0.007570838132697767}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9780992827455363, "res": {"Yes": 0.9780992827455363, "No": 0.021899974643311712}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9957960716504922, "res": {"Yes": 0.9957960716504922, "No": 0.004203612518225239}, "ground_truth": 1}, {"key": "36795599", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999214926618624, "res": {"Yes": 0.9999214926618624, "No": 7.831879072833073e-05}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.999983475621529, "res": {"Yes": 0.999983475621529, "No": 1.6322321006579524e-05}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997174894836135, "res": {"Yes": 0.9997174894836135, "No": 0.0002823628816218961}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999957132395842, "res": {"Yes": 0.999957132395842, "No": 4.264647230963406e-05}, "ground_truth": 1}, {"key": "38641949", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.020492301499070928, "res": {"No": 0.9795073919201839, "Yes": 0.020492301499070928}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992840100432235, "res": {"Yes": 0.9992840100432235, "No": 0.0007158706956357154}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.04476528626843556, "res": {"No": 0.9552308537866885, "Yes": 0.04476528626843556}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999676219241812, "res": {"Yes": 0.9999676219241812, "No": 3.220947158708221e-05}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9735003973534618, "res": {"Yes": 0.9735003973534618, "No": 0.026499426174946782}, "ground_truth": 1}, {"key": "29968443", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.271641689262848, "res": {"No": 0.728358191862015, "Yes": 0.271641689262848}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9975779318519622, "res": {"Yes": 0.9975779318519622, "No": 0.0024219627834736342}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.847462346180574, "res": {"Yes": 0.847462346180574, "No": 0.15253689160908276}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.4577377303713877, "res": {"No": 0.542261864166741, "Yes": 0.4577377303713877}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999440206399028, "res": {"Yes": 0.9999440206399028, "No": 5.5733341469385316e-05}, "ground_truth": 1}, {"key": "21268042", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9703807196558065, "res": {"Yes": 0.9703807196558065, "No": 0.029619095719424234}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.998265872938883, "res": {"Yes": 0.998265872938883, "No": 0.0017341151425043716}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.0987240565630833e-06, "res": {"No": 0.9999980183344636, "Yes": 1.0987240565630833e-06}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.6853141998306256, "res": {"Yes": 0.6853141998306256, "No": 0.3146850756786323}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995559630436025, "res": {"Yes": 0.9995559630436025, "No": 0.00044360213038882}, "ground_truth": 1}, {"key": "26808572", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999634499379698, "res": {"Yes": 0.9999634499379698, "No": 3.6051070493004674e-05}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9914355536251583, "res": {"Yes": 0.9914355536251583, "No": 0.008563933271753225}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8017815738645055, "res": {"Yes": 0.8017815738645055, "No": 0.19821804833619663}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997003328091847, "res": {"Yes": 0.9997003328091847, "No": 0.00029949944305294443}, "ground_truth": 1}, {"key": "37829390", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0012451989034734043, "res": {"No": 0.9987547095185042, "Yes": 0.0012451989034734043}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 9.30143377809829e-06, "res": {"No": 0.9999902701413353, "Yes": 9.30143377809829e-06}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 9.969151399651434e-05, "res": {"No": 0.9998990843823236, "Yes": 9.969151399651434e-05}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.009369430159525273, "res": {"No": 0.990630020417496, "Yes": 0.009369430159525273}, "ground_truth": 1}, {"key": "35716045", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.09746844445291312, "res": {"No": 0.9025304046316732, "Yes": 0.09746844445291312}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 8.08305152297251e-05, "res": {"No": 0.9999188703911848, "Yes": 8.08305152297251e-05}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.5999897543470732, "res": {"Yes": 0.5999897543470732, "No": 0.4000088128467434}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.006466794071478606, "res": {"No": 0.9935324204112972, "Yes": 0.006466794071478606}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0009301900852131526, "res": {"No": 0.9990678940808556, "Yes": 0.0009301900852131526}, "ground_truth": 1}, {"key": "34367070", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 7.52846722240725e-05, "res": {"No": 0.9999200623291858, "Yes": 7.52846722240725e-05}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00039991441350013444, "res": {"No": 0.9995997968026719, "Yes": 0.00039991441350013444}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0015434856671595974, "res": {"No": 0.9984533674707414, "Yes": 0.0015434856671595974}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0007202563987291609, "res": {"No": 0.9992790107777264, "Yes": 0.0007202563987291609}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.007170332153430602, "res": {"No": 0.9928293471964225, "Yes": 0.007170332153430602}, "ground_truth": 1}, {"key": "35239748", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.009648121941816634, "res": {"No": 0.9903508496997324, "Yes": 0.009648121941816634}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.3514972581200037e-06, "res": {"No": 0.9999984951481323, "Yes": 1.3514972581200037e-06}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.05066240815037463, "res": {"No": 0.9493374203345133, "Yes": 0.05066240815037463}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 6.349039013340249e-05, "res": {"No": 0.9999361536682638, "Yes": 6.349039013340249e-05}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999956342685299, "res": {"Yes": 0.9999956342685299, "No": 4.229084578620976e-06}, "ground_truth": 1}, {"key": "40421370", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9938077392614654, "res": {"Yes": 0.9938077392614654, "No": 0.006191012099981079}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990938309793469, "res": {"Yes": 0.9990938309793469, "No": 0.0009046178216282635}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.2241773274292188, "res": {"No": 0.7758218188876059, "Yes": 0.2241773274292188}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999539140419904, "res": {"Yes": 0.9999539140419904, "No": 4.524759673760166e-05}, "ground_truth": 1}, {"key": "37288396", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993318674000538, "res": {"Yes": 0.9993318674000538, "No": 0.0006675970399860562}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.2327940550913736, "res": {"No": 0.7672053362113412, "Yes": 0.2327940550913736}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9973184417178409, "res": {"Yes": 0.9973184417178409, "No": 0.0026810405362980606}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.015088320670045148, "res": {"No": 0.984911525176635, "Yes": 0.015088320670045148}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.07817374730555564, "res": {"No": 0.9218258150899933, "Yes": 0.07817374730555564}, "ground_truth": 1}, {"key": "38903688", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9946587639983805, "res": {"Yes": 0.9946587639983805, "No": 0.005339202402465225}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999900317366834, "res": {"Yes": 0.9999900317366834, "No": 9.001232910092958e-06}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.008281493106250924, "res": {"No": 0.9917181520347251, "Yes": 0.008281493106250924}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8941176794294463, "res": {"Yes": 0.8941176794294463, "No": 0.10588174720628413}, "ground_truth": 1}, {"key": "28071228", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998857350087414, "res": {"Yes": 0.9998857350087414, "No": 0.00011399573757064237}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 4.0652313374339e-07}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.024545091098252272, "res": {"No": 0.9754548665310839, "Yes": 0.024545091098252272}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.008636887535625831, "res": {"No": 0.991363018887811, "Yes": 0.008636887535625831}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.021985217132613002, "res": {"No": 0.9780147864422561, "Yes": 0.021985217132613002}, "ground_truth": 1}, {"key": "36855834", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.09640026773841921, "res": {"No": 0.9035992865071395, "Yes": 0.09640026773841921}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.04141529590841215, "res": {"No": 0.9585845832061551, "Yes": 0.04141529590841215}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.170096127525842e-05, "res": {"No": 0.9999689331225854, "Yes": 2.170096127525842e-05}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0005298822743283764, "res": {"No": 0.9994667670892281, "Yes": 0.0005298822743283764}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.2969919336428338, "res": {"No": 0.702997692175333, "Yes": 0.2969919336428338}, "ground_truth": 1}, {"key": "40548717", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9429213574082328, "res": {"Yes": 0.9429213574082328, "No": 0.057075535740784694}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9971701239693133, "res": {"Yes": 0.9971701239693133, "No": 0.0028291733852818454}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.001405113776162499, "res": {"No": 0.9985948018168358, "Yes": 0.001405113776162499}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.006940021545009606, "res": {"No": 0.9930596035721487, "Yes": 0.006940021545009606}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999881244990143, "res": {"Yes": 0.9999881244990143, "No": 1.139245800513929e-05}, "ground_truth": 1}, {"key": "37051175", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994371162785147, "res": {"Yes": 0.9994371162785147, "No": 0.0005624554651987753}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9331849091907116, "res": {"Yes": 0.9331849091907116, "No": 0.06681442357271847}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9989152601560678, "res": {"Yes": 0.9989152601560678, "No": 0.0010846954745522054}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.3445561885797739, "res": {"No": 0.655443534894836, "Yes": 0.3445561885797739}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9869420110600938, "res": {"Yes": 0.9869420110600938, "No": 0.013057795072198713}, "ground_truth": 1}, {"key": "38882119", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.98388389674912, "res": {"Yes": 0.98388389674912, "No": 0.01611607593317921}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9023032518785316, "res": {"Yes": 0.9023032518785316, "No": 0.09769663135556905}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00035493584611103385, "res": {"No": 0.9996449359501648, "Yes": 0.00035493584611103385}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.7080627919685202, "res": {"Yes": 0.7080627919685202, "No": 0.2919372491439974}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.346053334784254e-07}, "ground_truth": 1}, {"key": "19485402", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6336689004481423, "res": {"Yes": 0.6336689004481423, "No": 0.3663311401925787}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998086367022921, "res": {"Yes": 0.9998086367022921, "No": 0.00019098245362027616}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00687377041604561, "res": {"No": 0.9931257922073459, "Yes": 0.00687377041604561}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.3068017209960632, "res": {"No": 0.6931973111799383, "Yes": 0.3068017209960632}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.006401696151866211, "res": {"No": 0.9935977340013279, "Yes": 0.006401696151866211}, "ground_truth": 1}, {"key": "36060907", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995592955887298, "res": {"Yes": 0.9995592955887298, "No": 0.00044055630504320173}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.20375760548990604, "res": {"No": 0.7962421029079134, "Yes": 0.20375760548990604}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.01913548144465563, "res": {"No": 0.9808640304796162, "Yes": 0.01913548144465563}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.013430984031291874, "res": {"No": 0.9865689572994327, "Yes": 0.013430984031291874}, "ground_truth": 1}, {"key": "24037309", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989498784639336, "res": {"Yes": 0.9989498784639336, "No": 0.0010496962944842117}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00014656361378010815, "res": {"No": 0.9998530848030946, "Yes": 0.00014656361378010815}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0008485339180144622, "res": {"No": 0.9991514235448115, "Yes": 0.0008485339180144622}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9134351466926002, "res": {"Yes": 0.9134351466926002, "No": 0.08656411722771097}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.992363058760811, "res": {"Yes": 0.992363058760811, "No": 0.007636621390415802}, "ground_truth": 1}, {"key": "35605805", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.09705790692416048, "res": {"No": 0.9029420162270495, "Yes": 0.09705790692416048}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.02503802524193888, "res": {"No": 0.9749618041328685, "Yes": 0.02503802524193888}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0007458306457153581, "res": {"No": 0.9992522389127694, "Yes": 0.0007458306457153581}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.83478622906837, "res": {"Yes": 0.83478622906837, "No": 0.16521335165581594}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.0446601852536415e-07}, "ground_truth": 1}, {"key": "17706248", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.99999861435166, "res": {"Yes": 0.99999861435166, "No": 7.55102753203091e-07}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9975787642313358, "res": {"Yes": 0.9975787642313358, "No": 0.0024208561993553147}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.9502103266220644e-05, "res": {"No": 0.9999696483206215, "Yes": 2.9502103266220644e-05}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00368804046970741, "res": {"No": 0.9963113762480799, "Yes": 0.00368804046970741}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988902877865004, "res": {"Yes": 0.9988902877865004, "No": 0.0011092893432497577}, "ground_truth": 1}, {"key": "36883559", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9190892269410088, "res": {"Yes": 0.9190892269410088, "No": 0.08091059494655625}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0010768774237059926, "res": {"No": 0.9989200194991628, "Yes": 0.0010768774237059926}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.027102741333356765, "res": {"No": 0.9728962562887375, "Yes": 0.027102741333356765}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6748951388699075, "res": {"Yes": 0.6748951388699075, "No": 0.3251042106159246}, "ground_truth": 1}, {"key": "32799471", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.07827140035404205, "res": {"No": 0.9217281694097416, "Yes": 0.07827140035404205}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.000594501689472379, "res": {"No": 0.9994038960805794, "Yes": 0.000594501689472379}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999515300767047, "res": {"Yes": 0.9999515300767047, "No": 4.825413665846594e-05}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998685791264796, "res": {"Yes": 0.9998685791264796, "No": 0.00013124759243672758}, "ground_truth": 1}, {"key": "34797243", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.322392449698877e-06}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988346225802949, "res": {"Yes": 0.9988346225802949, "No": 0.0011651868716245637}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 7.539415438457082e-07, "res": {"No": 0.9999989719621284, "Yes": 7.539415438457082e-07}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.04677289549144291, "res": {"No": 0.9532270367171263, "Yes": 0.04677289549144291}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995299958465729, "res": {"Yes": 0.9995299958465729, "No": 0.0004697346956396231}, "ground_truth": 1}, {"key": "32154876", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999994561441089, "res": {"Yes": 0.999994561441089, "No": 5.133573769989688e-06}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 7.291761512782744e-07}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.2684152614211953e-05, "res": {"No": 0.9999770387506135, "Yes": 2.2684152614211953e-05}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999912237625114, "res": {"Yes": 0.9999912237625114, "No": 8.551498732724788e-06}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9949843990432343, "res": {"Yes": 0.9949843990432343, "No": 0.005015435609622437}, "ground_truth": 1}, {"key": "37962274", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9948451580339351, "res": {"Yes": 0.9948451580339351, "No": 0.005154495667272596}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999323394050813, "res": {"Yes": 0.9999323394050813, "No": 6.742524872713585e-05}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0005912464632465732, "res": {"No": 0.9994084194528139, "Yes": 0.0005912464632465732}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.999934961715081, "res": {"Yes": 0.999934961715081, "No": 6.453431242693593e-05}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.995485869453524, "res": {"Yes": 0.995485869453524, "No": 0.004513628064372632}, "ground_truth": 1}, {"key": "35574030", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.006275134876075423, "res": {"No": 0.9937247312597783, "Yes": 0.006275134876075423}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999088581436714, "res": {"Yes": 0.9999088581436714, "No": 9.100746698804992e-05}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.0276007221352225e-05, "res": {"No": 0.9999695291212467, "Yes": 3.0276007221352225e-05}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.43652911713723225, "res": {"No": 0.5634708089216706, "Yes": 0.43652911713723225}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.09395787833118088, "res": {"No": 0.9060420184812137, "Yes": 0.09395787833118088}, "ground_truth": 1}, {"key": "39105949", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5605684056152965, "res": {"Yes": 0.5605684056152965, "No": 0.43943158038730934}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.5054660014770486, "res": {"Yes": 0.5054660014770486, "No": 0.4945335074263125}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 4.92824849932036e-07, "res": {"No": 0.9999989719621284, "Yes": 4.92824849932036e-07}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00021673980048429482, "res": {"No": 0.9997827784660145, "Yes": 0.00021673980048429482}, "ground_truth": 1}, {"key": "41064322", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0393655354997182e-05, "res": {"No": 0.9999893165220688, "Yes": 1.0393655354997182e-05}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.8891244447146115e-05, "res": {"No": 0.9999807339855921, "Yes": 1.8891244447146115e-05}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0010108086751779248, "res": {"No": 0.9989881857296089, "Yes": 0.0010108086751779248}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8557218904192844, "res": {"Yes": 0.8557218904192844, "No": 0.144276699336519}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9943815763109501, "res": {"Yes": 0.9943815763109501, "No": 0.00561781601519862}, "ground_truth": 1}, {"key": "28105101", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.810687974966741, "res": {"Yes": 0.810687974966741, "No": 0.1893112676164918}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.10512572123240783, "res": {"No": 0.8948732955025953, "Yes": 0.10512572123240783}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0009530949752897682, "res": {"No": 0.9990461187342505, "Yes": 0.0009530949752897682}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.003320255304714253, "res": {"No": 0.9966796406257388, "Yes": 0.003320255304714253}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.07126908756941058, "res": {"No": 0.9287308056758143, "Yes": 0.07126908756941058}, "ground_truth": 1}, {"key": "36036068", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9630354979744478, "res": {"Yes": 0.9630354979744478, "No": 0.03696395612214431}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.4468122477543381, "res": {"No": 0.553187320354071, "Yes": 0.4468122477543381}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.975272605187113, "res": {"Yes": 0.975272605187113, "No": 0.024727220441126806}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999919585553415, "res": {"Yes": 0.999919585553415, "No": 7.994984958895216e-05}, "ground_truth": 1}, {"key": "37991460", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.99793122137843, "res": {"Yes": 0.99793122137843, "No": 0.002068533452182413}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.903446133986983, "res": {"Yes": 0.903446133986983, "No": 0.09655321228232627}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 2.6587778384067267e-06, "res": {"No": 0.9999967070975216, "Yes": 2.6587778384067267e-06}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9550092449235912, "res": {"Yes": 0.9550092449235912, "No": 0.044989398763463674}, "ground_truth": 1}, {"key": "38437830", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.07667703720374427, "res": {"No": 0.9233229306281844, "Yes": 0.07667703720374427}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.2889584188366737e-05, "res": {"No": 0.999983475621529, "Yes": 1.2889584188366737e-05}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 8.996192794200804e-05, "res": {"No": 0.9999085005663285, "Yes": 8.996192794200804e-05}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999938462231346, "res": {"Yes": 0.9999938462231346, "No": 5.8914583106740544e-06}, "ground_truth": 1}, {"key": "36507138", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9929167840664543, "res": {"Yes": 0.9929167840664543, "No": 0.007082204851883641}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.03247612743548742, "res": {"No": 0.9675229204221509, "Yes": 0.03247612743548742}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 9.988581174148716e-06, "res": {"No": 0.9999893165220688, "Yes": 9.988581174148716e-06}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0007327582642746187, "res": {"No": 0.999265807051635, "Yes": 0.0007327582642746187}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.2207199887594163, "res": {"No": 0.7792792460621114, "Yes": 0.2207199887594163}, "ground_truth": 1}, {"key": "37824866", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.002351330360865168, "res": {"No": 0.9976476988067997, "Yes": 0.002351330360865168}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8297663946794742, "res": {"Yes": 0.8297663946794742, "No": 0.17023289651458992}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.06626046263624934, "res": {"No": 0.9337385546623045, "Yes": 0.06626046263624934}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9971734484403313, "res": {"Yes": 0.9971734484403313, "No": 0.00282479354067874}, "ground_truth": 1}, {"key": "25088134", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6219570500460645, "res": {"Yes": 0.6219570500460645, "No": 0.3780398370100858}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.6942909708419772, "res": {"Yes": 0.6942909708419772, "No": 0.30570619051376996}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0010392208804478836, "res": {"No": 0.9989603464146611, "Yes": 0.0010392208804478836}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0007871641928388888, "res": {"No": 0.9992126002619988, "Yes": 0.0007871641928388888}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.2919434674736291, "res": {"No": 0.7080563344653037, "Yes": 0.2919434674736291}, "ground_truth": 1}, {"key": "40172531", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.1917695093948062, "res": {"No": 0.8082302970260394, "Yes": 0.1917695093948062}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0001285200030480595, "res": {"No": 0.9998712012652693, "Yes": 0.0001285200030480595}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995933624294768, "res": {"Yes": 0.9995933624294768, "No": 0.00040568441645023607}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999249493064443, "res": {"Yes": 0.9999249493064443, "No": 7.364362329491481e-05}, "ground_truth": 1}, {"key": "37035874", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989538044445656, "res": {"Yes": 0.9989538044445656, "No": 0.0010444996625927688}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.07012827597566, "res": {"No": 0.9298681472841293, "Yes": 0.07012827597566}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 8.353867881560124e-07, "res": {"No": 0.9999983759447187, "Yes": 8.353867881560124e-07}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0003882315958081693, "res": {"No": 0.9996109902139353, "Yes": 0.0003882315958081693}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9895539746791882, "res": {"Yes": 0.9895539746791882, "No": 0.010444827491528915}, "ground_truth": 1}, {"key": "36404465", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.018166991234888394, "res": {"No": 0.9818327478550047, "Yes": 0.018166991234888394}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.3450578966506545e-06, "res": {"No": 0.9999982567412194, "Yes": 1.3450578966506545e-06}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.1982048339110556e-05, "res": {"No": 0.9999872900832717, "Yes": 1.1982048339110556e-05}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00027238773783286156, "res": {"No": 0.9997272578209124, "Yes": 0.00027238773783286156}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997197537263252, "res": {"Yes": 0.9997197537263252, "No": 0.0002799203386767683}, "ground_truth": 1}, {"key": "39602052", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988727991686613, "res": {"Yes": 0.9988727991686613, "No": 0.001127091340204143}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.5361559332381435, "res": {"Yes": 0.5361559332381435, "No": 0.4638432532964789}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0002482220126411762, "res": {"No": 0.9997514461946165, "Yes": 0.0002482220126411762}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.2634328052231433e-05, "res": {"No": 0.9999851444463448, "Yes": 1.2634328052231433e-05}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9817785119302177, "res": {"Yes": 0.9817785119302177, "No": 0.01821997790189232}, "ground_truth": 1}, {"key": "33792789", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9749419736114495, "res": {"Yes": 0.9749419736114495, "No": 0.025057106476687713}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7411348992390935, "res": {"Yes": 0.7411348992390935, "No": 0.25886398750182793}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.4771114607242345e-05, "res": {"No": 0.9999851444463448, "Yes": 1.4771114607242345e-05}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.38798011138099514, "res": {"No": 0.6120198269606844, "Yes": 0.38798011138099514}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.05902563723796313, "res": {"No": 0.9409742069758515, "Yes": 0.05902563723796313}, "ground_truth": 1}, {"key": "32776626", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.005813034240199217, "res": {"No": 0.9941869969646732, "Yes": 0.005813034240199217}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0009132690800821345, "res": {"No": 0.9990866888827148, "Yes": 0.0009132690800821345}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.1753799593349925e-05, "res": {"No": 0.9999866940725246, "Yes": 1.1753799593349925e-05}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9926510019209128, "res": {"Yes": 0.9926510019209128, "No": 0.007348970820378706}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 7.248276025169254e-07}, "ground_truth": 1}, {"key": "37195090", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 2.195567505954749e-06}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.0, "res": {"Yes": 1.0, " Yes": 1.3927465655294988e-08}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.5203620008702482e-05, "res": {"No": 0.9999788267671561, "Yes": 1.5203620008702482e-05}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0037092829350716724, "res": {"No": 0.9962891292619569, "Yes": 0.0037092829350716724}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6490835591171327, "res": {"Yes": 0.6490835591171327, "No": 0.35091519303319174}, "ground_truth": 1}, {"key": "33981824", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.04646868658514891, "res": {"No": 0.9535305286425902, "Yes": 0.04646868658514891}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995403617160561, "res": {"Yes": 0.9995403617160561, "No": 0.0004564558850264188}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00045108083476950474, "res": {"No": 0.9995434523196234, "Yes": 0.00045108083476950474}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.29411421520299735, "res": {"No": 0.7058825465422965, "Yes": 0.29411421520299735}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.005096095095877027, "res": {"No": 0.9949006045878039, "Yes": 0.005096095095877027}, "ground_truth": 1}, {"key": "39569142", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0042401255471489685, "res": {"No": 0.9957584817553452, "Yes": 0.0042401255471489685}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.001675283791994503, "res": {"No": 0.998323373710876, "Yes": 0.001675283791994503}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 6.697421207909891e-06, "res": {"No": 0.9999925349918634, "Yes": 6.697421207909891e-06}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999964686909351, "res": {"Yes": 0.9999964686909351, "No": 3.2814603696708962e-06}, "ground_truth": 1}, {"key": "40268210", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0015164741148331648, "res": {"No": 0.9984830788896564, "Yes": 0.0015164741148331648}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.981991012411502, "res": {"Yes": 0.981991012411502, "No": 0.018008790125135125}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5711665389170215, "res": {"Yes": 0.5711665389170215, "No": 0.4288329199075153}, "ground_truth": 1}, {"key": "34925159", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.09566115182316487, "res": {"No": 0.9043384563883236, "Yes": 0.09566115182316487}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.618481663447419e-05, "res": {"No": 0.9999828796125555, "Yes": 1.618481663447419e-05}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0067132687537929435, "res": {"No": 0.9932865406386182, "Yes": 0.0067132687537929435}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0071735401604201025, "res": {"No": 0.9928264099151438, "Yes": 0.0071735401604201025}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 7.797385342273495e-05, "res": {"No": 0.9999214926618624, "Yes": 7.797385342273495e-05}, "ground_truth": 1}, {"key": "36181903", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0011869959207089266, "res": {"No": 0.9988127368552375, "Yes": 0.0011869959207089266}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 8.551198640296281e-05, "res": {"No": 0.9999141026393895, "Yes": 8.551198640296281e-05}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.8244976641803663, "res": {"Yes": 0.8244976641803663, "No": 0.17550148053762094}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.979858078168593, "res": {"Yes": 0.979858078168593, "No": 0.020140902124874956}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9479727821040373, "res": {"Yes": 0.9479727821040373, "No": 0.05202649348763084}, "ground_truth": 1}, {"key": "38620559", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9960466222550967, "res": {"Yes": 0.9960466222550967, "No": 0.003952665964535066}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.534491420551213, "res": {"Yes": 0.534491420551213, "No": 0.4655075329053142}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.2415932885784057e-05, "res": {"No": 0.9999870516788303, "Yes": 1.2415932885784057e-05}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0001993353451513816, "res": {"No": 0.999798863910576, "Yes": 0.0001993353451513816}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9399535996602482, "res": {"Yes": 0.9399535996602482, "No": 0.060045918567599596}, "ground_truth": 1}, {"key": "32719657", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7311830062628921, "res": {"Yes": 0.7311830062628921, "No": 0.2688169000767999}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8751533944905259, "res": {"Yes": 0.8751533944905259, "No": 0.12484590027501911}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4508607254145535, "res": {"No": 0.5491389900635154, "Yes": 0.4508607254145535}, "ground_truth": 1}, {"key": "37530914", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992885365602201, "res": {"Yes": 0.9992885365602201, "No": 0.0007113168410980697}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9873870490082266, "res": {"Yes": 0.9873870490082266, "No": 0.01261282658350479}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.8289105559691058e-05, "res": {"No": 0.9999800187796273, "Yes": 1.8289105559691058e-05}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 2.2211330864359153e-05, "res": {"No": 0.999977753956447, "Yes": 2.2211330864359153e-05}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999971839107652, "res": {"Yes": 0.9999971839107652, "No": 2.2078993827377345e-06}, "ground_truth": 1}, {"key": "33306933", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997110543328424, "res": {"Yes": 0.9997110543328424, "No": 0.0002885281220471848}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.2634934418303032, "res": {"No": 0.7365062625446419, "Yes": 0.2634934418303032}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9959870199113291, "res": {"Yes": 0.9959870199113291, "No": 0.004012313385075302}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00014273882445834442, "res": {"No": 0.9998566603941031, "Yes": 0.00014273882445834442}, "ground_truth": 1}, {"key": "33837212", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998675064280487, "res": {"Yes": 0.9998675064280487, "No": 0.00013218303064746863}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.6649041562542306e-06, "res": {"No": 0.9999971839107652, "Yes": 1.6649041562542306e-06}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.06364538897777275, "res": {"No": 0.9363544390357736, "Yes": 0.06364538897777275}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995651340216308, "res": {"Yes": 0.9995651340216308, "No": 0.0004343179883938481}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999397295583361, "res": {"Yes": 0.9999397295583361, "No": 5.991093591344864e-05}, "ground_truth": 1}, {"key": "40945179", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999841908319662, "res": {"Yes": 0.9999841908319662, "No": 1.5642030561132537e-05}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8815451666997195, "res": {"Yes": 0.8815451666997195, "No": 0.11845432923440902}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0519413698185698, "res": {"No": 0.9480584950419093, "Yes": 0.0519413698185698}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997926665865435, "res": {"Yes": 0.9997926665865435, "No": 0.00020709850672382597}, "ground_truth": 1}, {"key": "34152358", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999813299942867, "res": {"Yes": 0.9999813299942867, "No": 1.8246632783000323e-05}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992677129531263, "res": {"Yes": 0.9992677129531263, "No": 0.0007317372913634098}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.376649445933645e-05, "res": {"No": 0.9999560596094073, "Yes": 4.376649445933645e-05}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.21294580122381473, "res": {"No": 0.7870535576167379, "Yes": 0.21294580122381473}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999937270200753, "res": {"Yes": 0.9999937270200753, "No": 6.235336567102903e-06}, "ground_truth": 1}, {"key": "34136541", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999361536682638, "res": {"Yes": 0.9999361536682638, "No": 6.36050301714269e-05}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.45895009514816404, "res": {"No": 0.5410498284679588, "Yes": 0.45895009514816404}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 9.88243031657909e-05, "res": {"No": 0.9998996803423534, "Yes": 9.88243031657909e-05}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9928457958343208, "res": {"Yes": 0.9928457958343208, "No": 0.007153975949331982}, "ground_truth": 1}, {"key": "37469603", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.026151048334534938, "res": {"No": 0.9738488238881305, "Yes": 0.026151048334534938}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 9.164217192846741e-05, "res": {"No": 0.9999069510593213, "Yes": 9.164217192846741e-05}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.009233958954013265, "res": {"No": 0.9907658649191818, "Yes": 0.009233958954013265}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998338996861849, "res": {"Yes": 0.9998338996861849, "No": 0.00016571203581330866}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991357205548188, "res": {"Yes": 0.9991357205548188, "No": 0.0008640620280608731}, "ground_truth": 1}, {"key": "37353611", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9982362942601526, "res": {"Yes": 0.9982362942601526, "No": 0.0017632810015153631}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9709150894625591, "res": {"Yes": 0.9709150894625591, "No": 0.02908449688095219}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0005986155413815874, "res": {"No": 0.9994012751572927, "Yes": 0.0005986155413815874}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.3157961084712934, "res": {"No": 0.6842037675156853, "Yes": 0.3157961084712934}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8517851800806804, "res": {"Yes": 0.8517851800806804, "No": 0.14821413393294477}, "ground_truth": 1}, {"key": "37211649", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9245703831582942, "res": {"Yes": 0.9245703831582942, "No": 0.07542895945912205}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9983427387765006, "res": {"Yes": 0.9983427387765006, "No": 0.0016565249076928507}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0036127887425650043, "res": {"No": 0.9963869919774037, "Yes": 0.0036127887425650043}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.998960703642945, "res": {"Yes": 0.998960703642945, "No": 0.0010388481787661102}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999920539107184, "res": {"Yes": 0.999920539107184, "No": 7.919115061862439e-05}, "ground_truth": 1}, {"key": "37320976", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8955081065337595, "res": {"Yes": 0.8955081065337595, "No": 0.10449156798202942}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.999502733378049, "res": {"Yes": 0.999502733378049, "No": 0.0004968127318281392}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.2724758170387764e-05, "res": {"No": 0.9999862172649827, "Yes": 1.2724758170387764e-05}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.5884092726127725e-06, "res": {"No": 0.9999980183344636, "Yes": 1.5884092726127725e-06}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00016947214176844444, "res": {"No": 0.9998297282578789, "Yes": 0.00016947214176844444}, "ground_truth": 1}, {"key": "34492412", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.07579292715410459, "res": {"No": 0.9241978609840618, "Yes": 0.07579292715410459}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.007997422313786771, "res": {"No": 0.992002084885877, "Yes": 0.007997422313786771}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.10806235039174651, "res": {"No": 0.8919370594913784, "Yes": 0.10806235039174651}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8977539015186072, "res": {"Yes": 0.8977539015186072, "No": 0.10224544834636719}, "ground_truth": 1}, {"key": "36655016", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.010444001338349126, "res": {"No": 0.989554910797691, "Yes": 0.010444001338349126}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 2.001391052353037e-05, "res": {"No": 0.9999784691637917, "Yes": 2.001391052353037e-05}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00018677852524374522, "res": {"No": 0.9998131655857234, "Yes": 0.00018677852524374522}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 2.404598769820426e-06, "res": {"No": 0.9999959918780326, "Yes": 2.404598769820426e-06}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999490269261713, "res": {"Yes": 0.9999490269261713, "No": 5.066364326337327e-05}, "ground_truth": 1}, {"key": "35220773", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.37582609721075255, "res": {"No": 0.6241731906523412, "Yes": 0.37582609721075255}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.08957180364401959, "res": {"No": 0.910428045859391, "Yes": 0.08957180364401959}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.3046352045715847e-05, "res": {"No": 0.9999866940725246, "Yes": 1.3046352045715847e-05}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 8.772066969340392e-05, "res": {"No": 0.9999117187730169, "Yes": 8.772066969340392e-05}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.09775111241273339, "res": {"No": 0.9022486154616608, "Yes": 0.09775111241273339}, "ground_truth": 1}, {"key": "31569808", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.014117243295604893, "res": {"No": 0.9858817554988986, "Yes": 0.014117243295604893}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.005071381567395091, "res": {"No": 0.9949276321262673, "Yes": 0.005071381567395091}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.957390424080644e-05, "res": {"No": 0.999929955493231, "Yes": 6.957390424080644e-05}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.4918387107080065, "res": {"No": 0.5081603355703868, "Yes": 0.4918387107080065}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9974116475756619, "res": {"Yes": 0.9974116475756619, "No": 0.002587262789884638}, "ground_truth": 1}, {"key": "37696256", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998304433663511, "res": {"Yes": 0.9998304433663511, "No": 0.00016838576341849444}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9628368692768108, "res": {"Yes": 0.9628368692768108, "No": 0.03716088311924995}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9984345881373411, "res": {"Yes": 0.9984345881373411, "No": 0.0015652411146313608}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9800549788732933, "res": {"Yes": 0.9800549788732933, "No": 0.019944995883846406}, "ground_truth": 1}, {"key": "36874328", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9200670473869345, "res": {"Yes": 0.9200670473869345, "No": 0.07993250403384482}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.22127506795958082, "res": {"No": 0.778724822547679, "Yes": 0.22127506795958082}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9999981375378344, "res": {"Yes": 0.9999981375378344, "No": 1.2030193936853169e-06}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999398487531588, "res": {"Yes": 0.9999398487531588, "No": 5.963505414464734e-05}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999759659438225, "res": {"Yes": 0.9999759659438225, "No": 2.320306908255817e-05}, "ground_truth": 1}, {"key": "24532377", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995266633991314, "res": {"Yes": 0.9995266633991314, "No": 0.0004728758393591096}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999962302846054, "res": {"Yes": 0.9999962302846054, "No": 3.019645855030339e-06}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0002041925779210122, "res": {"No": 0.999795526887477, "Yes": 0.0002041925779210122}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.06677830677894782, "res": {"No": 0.9332214487611799, "Yes": 0.06677830677894782}, "ground_truth": 1}, {"key": "39560618", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8380559873932413, "res": {"Yes": 0.8380559873932413, "No": 0.16194357611583693}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 3.5930576675123573e-06, "res": {"No": 0.9999963494876631, "Yes": 3.5930576675123573e-06}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.984073871583738, "res": {"Yes": 0.984073871583738, "No": 0.01592447094085665}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999412791111388, "res": {"Yes": 0.9999412791111388, "No": 5.7872224703206526e-05}, "ground_truth": 1}, {"key": "34922693", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988444940117654, "res": {"Yes": 0.9988444940117654, "No": 0.0011550172500634942}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999555828164723, "res": {"Yes": 0.9999555828164723, "No": 4.392284438481221e-05}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8204675239825887, "res": {"Yes": 0.8204675239825887, "No": 0.17953218203872554}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999537948404913, "res": {"Yes": 0.9999537948404913, "No": 4.5718341264492487e-05}, "ground_truth": 1}, {"key": "33629577", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999996945503965, "res": {"Yes": 0.999996945503965, "No": 2.5201629394986605e-06}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9552991657427726, "res": {"Yes": 0.9552991657427726, "No": 0.0447005577415884}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00013809634006001968, "res": {"No": 0.9998617854325136, "Yes": 0.00013809634006001968}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989026493300779, "res": {"Yes": 0.9989026493300779, "No": 0.001097220297181723}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 1.8220707899388088e-07}, "ground_truth": 1}, {"key": "32284359", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999798995780161, "res": {"Yes": 0.9999798995780161, "No": 1.9735628547053354e-05}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998277021549788, "res": {"Yes": 0.9998277021549788, "No": 0.0001721392182697858}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.6795754391455184, "res": {"Yes": 0.6795754391455184, "No": 0.32042392317073987}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.3429560411300801, "res": {"No": 0.6570425227429066, "Yes": 0.3429560411300801}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9815442816320886, "res": {"Yes": 0.9815442816320886, "No": 0.018453921198373063}, "ground_truth": 1}, {"key": "28082962", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9601979575466345, "res": {"Yes": 0.9601979575466345, "No": 0.03979936187944706}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0011702517293781143, "res": {"No": 0.9988292720373195, "Yes": 0.0011702517293781143}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9837433678263093, "res": {"Yes": 0.9837433678263093, "No": 0.016256518697994243}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9786210970105989, "res": {"Yes": 0.9786210970105989, "No": 0.02137718814589726}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 5.90477680294792e-07}, "ground_truth": 1}, {"key": "24796803", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999844292352256, "res": {"Yes": 0.9999844292352256, "No": 1.5197190237431304e-05}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, " Yes": 1.8932608331062527e-07}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 9.060402616404691e-06, "res": {"No": 0.9999870516788303, "Yes": 9.060402616404691e-06}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.19761325815363395, "res": {"No": 0.8023857513756432, "Yes": 0.19761325815363395}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0015656166610197497, "res": {"No": 0.998434350210407, "Yes": 0.0015656166610197497}, "ground_truth": 1}, {"key": "35466150", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.06008770704758438, "res": {"No": 0.9399119954148376, "Yes": 0.06008770704758438}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.06491739911901744, "res": {"No": 0.935081984107494, "Yes": 0.06491739911901744}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9999891973193493, "res": {"Yes": 0.9999891973193493, "No": 1.0607630047367479e-05}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9977801262721592, "res": {"Yes": 0.9977801262721592, "No": 0.00221982436742529}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999262829213989, "res": {"Yes": 0.999262829213989, "No": 0.0007370619590804112}, "ground_truth": 1}, {"key": "35754289", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9972590433998094, "res": {"Yes": 0.9972590433998094, "No": 0.002740898753884082}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.989760981333108, "res": {"Yes": 0.989760981333108, "No": 0.010238194431158995}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0005321607247809734, "res": {"No": 0.9994674819081155, "Yes": 0.0005321607247809734}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 6.12229156380731e-05, "res": {"No": 0.9999385375988907, "Yes": 6.12229156380731e-05}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6169915996495394, "res": {"Yes": 0.6169915996495394, "No": 0.38300819238158745}, "ground_truth": 1}, {"key": "36678662", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 4.170531801287868e-06, "res": {"No": 0.9999951574563252, "Yes": 4.170531801287868e-06}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0022946737555935392, "res": {"No": 0.997705005136906, "Yes": 0.0022946737555935392}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00014485562517775307, "res": {"No": 0.9998492708507798, "Yes": 0.00014485562517775307}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 5.906589298436896e-06, "res": {"No": 0.999992773397112, "Yes": 5.906589298436896e-06}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1238474391858173, "res": {"No": 0.8761524355494325, "Yes": 0.1238474391858173}, "ground_truth": 1}, {"key": "35399671", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00082684467334037, "res": {"No": 0.9991714184134609, "Yes": 0.00082684467334037}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.004486850369966408, "res": {"No": 0.9955130388237245, "Yes": 0.004486850369966408}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.797350192449991e-05, "res": {"No": 0.9999816875976741, "Yes": 1.797350192449991e-05}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0003315877756928869, "res": {"No": 0.9996679270084451, "Yes": 0.0003315877756928869}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.005939216836541949, "res": {"No": 0.9940601123031868, "Yes": 0.005939216836541949}, "ground_truth": 1}, {"key": "36888180", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.04129006767783952, "res": {"No": 0.9587094728648499, "Yes": 0.04129006767783952}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0028282037108570642, "res": {"No": 0.997170717983733, "Yes": 0.0028282037108570642}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.828250319328033e-05, "res": {"No": 0.9999284059529762, "Yes": 6.828250319328033e-05}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0032174022489893385, "res": {"No": 0.9967823198643089, "Yes": 0.0032174022489893385}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9879141576288808, "res": {"Yes": 0.9879141576288808, "No": 0.01208543464274644}, "ground_truth": 1}, {"key": "28061069", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999996945503965, "res": {"Yes": 0.999996945503965, "No": 2.608557947125052e-06}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999932502087799, "res": {"Yes": 0.9999932502087799, "No": 6.444947934749085e-06}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0015289612434530408, "res": {"No": 0.9984707151496316, "Yes": 0.0015289612434530408}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.976579127697529, "res": {"Yes": 0.976579127697529, "No": 0.023419920859564007}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994073472880366, "res": {"Yes": 0.9994073472880366, "No": 0.0005922279183262166}, "ground_truth": 1}, {"key": "22259982", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997202304028145, "res": {"Yes": 0.9997202304028145, "No": 0.00027931957543013495}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999816875976741, "res": {"Yes": 0.9999816875976741, "No": 1.8159022742102777e-05}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9828251278981743, "res": {"Yes": 0.9828251278981743, "No": 0.017169864427464404}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 2.6187326122959948e-05, "res": {"No": 0.999972151525776, "Yes": 2.6187326122959948e-05}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0035518964743917543, "res": {"No": 0.9964474746030875, "Yes": 0.0035518964743917543}, "ground_truth": 1}, {"key": "34026805", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9441554998356871, "res": {"Yes": 0.9441554998356871, "No": 0.05584254192413905}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 8.897324005294098e-06, "res": {"No": 0.9999872900832717, "Yes": 8.897324005294098e-06}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00012116612743485905, "res": {"No": 0.999878702827097, "Yes": 0.00012116612743485905}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.1352730433226016, "res": {"No": 0.8647264455381113, "Yes": 0.1352730433226016}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9772671003721548, "res": {"Yes": 0.9772671003721548, "No": 0.022732521831489803}, "ground_truth": 1}, {"key": "36713809", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9984847378706702, "res": {"Yes": 0.9984847378706702, "No": 0.0015148291782626276}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.458215995565921, "res": {"No": 0.5417837512992688, "Yes": 0.458215995565921}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.021595409716524433, "res": {"No": 0.9784043407880455, "Yes": 0.021595409716524433}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9765150115231497, "res": {"Yes": 0.9765150115231497, "No": 0.023484317993835095}, "ground_truth": 1}, {"key": "39726411", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999458085984071, "res": {"Yes": 0.9999458085984071, "No": 5.359525606791706e-05}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999416367032035, "res": {"Yes": 0.9999416367032035, "No": 5.8042561358714474e-05}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.177251765607648e-06, "res": {"No": 0.9999919389784903, "Yes": 4.177251765607648e-06}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.984217149391775, "res": {"Yes": 0.984217149391775, "No": 0.015782603339768574}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9689054855312214, "res": {"Yes": 0.9689054855312214, "No": 0.031094367049877364}, "ground_truth": 1}, {"key": "37069841", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9709045279056603, "res": {"Yes": 0.9709045279056603, "No": 0.029094832438697094}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 2.2362927331989965e-05, "res": {"No": 0.9999739395305799, "Yes": 2.2362927331989965e-05}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9396932046715227, "res": {"Yes": 0.9396932046715227, "No": 0.060306547442953225}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998316352049432, "res": {"Yes": 0.9998316352049432, "No": 0.00016773201516353446}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, " Yes": 4.3032934621358076e-07}, "ground_truth": 1}, {"key": "38894693", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999983759447187, "res": {"Yes": 0.9999983759447187, "No": 1.3171595447255695e-06}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9893534688093388, "res": {"Yes": 0.9893534688093388, "No": 0.010645100921856008}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.02490473083959334, "res": {"No": 0.9750946263762579, "Yes": 0.02490473083959334}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 9.913504960456402e-05, "res": {"No": 0.9998976540877003, "Yes": 9.913504960456402e-05}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.853335611887107, "res": {"Yes": 0.853335611887107, "No": 0.1466633580122184}, "ground_truth": 1}, {"key": "33946032", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.06620126549388893, "res": {"No": 0.9337981197445145, "Yes": 0.06620126549388893}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.010406975255580412, "res": {"No": 0.9895926165268032, "Yes": 0.010406975255580412}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 8.631173413487085e-05, "res": {"No": 0.9999130299021183, "Yes": 8.631173413487085e-05}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.21550186827205953, "res": {"No": 0.7844962868204871, "Yes": 0.21550186827205953}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.965498097111025, "res": {"Yes": 0.965498097111025, "No": 0.03450028479677188}, "ground_truth": 1}, {"key": "39035311", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.20021219497403053, "res": {"No": 0.799784118184708, "Yes": 0.20021219497403053}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8814231869195273, "res": {"Yes": 0.8814231869195273, "No": 0.11857311552840742}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.048375025524213994, "res": {"No": 0.9516246777377301, "Yes": 0.048375025524213994}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.003886811979132135, "res": {"No": 0.9961118981180153, "Yes": 0.003886811979132135}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997697881628126, "res": {"Yes": 0.9997697881628126, "No": 0.00022886185264629587}, "ground_truth": 1}, {"key": "27680038", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.1393021031946325, "res": {"No": 0.8606976479913114, "Yes": 0.1393021031946325}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0007507359243959031, "res": {"No": 0.9992465214576283, "Yes": 0.0007507359243959031}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9819581368847204, "res": {"Yes": 0.9819581368847204, "No": 0.018041812467874462}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.09053796622049785, "res": {"No": 0.9094614207595434, "Yes": 0.09053796622049785}, "ground_truth": 1}, {"key": "36901907", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.004304604565608377, "res": {"No": 0.9956952504109077, "Yes": 0.004304604565608377}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.6310855040468392, "res": {"Yes": 0.6310855040468392, "No": 0.3689144148202234}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.056690756853169696, "res": {"No": 0.9433091182896968, "Yes": 0.056690756853169696}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0004542383943732797, "res": {"No": 0.9995454778265137, "Yes": 0.0004542383943732797}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999828796125555, "res": {"Yes": 0.9999828796125555, "No": 1.697459064465467e-05}, "ground_truth": 1}, {"key": "21530542", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997932624931442, "res": {"Yes": 0.9997932624931442, "No": 0.00020650849673359812}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.3198935483303888, "res": {"No": 0.6801063948747148, "Yes": 0.3198935483303888}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.6656617051132295e-05, "res": {"No": 0.9999826412106655, "Yes": 1.6656617051132295e-05}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9923884139608736, "res": {"Yes": 0.9923884139608736, "No": 0.007610929291831424}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7115193398661033, "res": {"Yes": 0.7115193398661033, "No": 0.28847729393387855}, "ground_truth": 1}, {"key": "38192532", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9956999796758698, "res": {"Yes": 0.9956999796758698, "No": 0.004298815755119159}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.05034027633086029, "res": {"No": 0.9496593164197823, "Yes": 0.05034027633086029}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.5459722875108327, "res": {"Yes": 0.5459722875108327, "No": 0.4540259291075291}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999894357248024, "res": {"Yes": 0.9999894357248024, "No": 9.861828108439012e-06}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8807530665661544, "res": {"Yes": 0.8807530665661544, "No": 0.11924608260807718}, "ground_truth": 1}, {"key": "34102400", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 6.488495274837057e-07}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.23191007273047054, "res": {"No": 0.7680886521571452, "Yes": 0.23191007273047054}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.45782003901463375, "res": {"No": 0.5421794195183077, "Yes": 0.45782003901463375}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999860980626328, "res": {"Yes": 0.9999860980626328, "No": 1.3458428417999604e-05}, "ground_truth": 1}, {"key": "36133399", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998075640681697, "res": {"Yes": 0.9998075640681697, "No": 0.00019193035233514683}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0012886457735082524, "res": {"No": 0.998711310174808, "Yes": 0.0012886457735082524}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.8178008839376318e-05, "res": {"No": 0.9999772771531678, "Yes": 1.8178008839376318e-05}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9974046510567169, "res": {"Yes": 0.9974046510567169, "No": 0.0025951524928156952}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8765913488750346, "res": {"Yes": 0.8765913488750346, "No": 0.12340853556602734}, "ground_truth": 1}, {"key": "34314544", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9752854193780551, "res": {"Yes": 0.9752854193780551, "No": 0.024714343386119164}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9962089084018817, "res": {"Yes": 0.9962089084018817, "No": 0.003790652163078714}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.4038664574159236e-05, "res": {"No": 0.9999621387467553, "Yes": 2.4038664574159236e-05}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8762645551883469, "res": {"Yes": 0.8762645551883469, "No": 0.12373530896684562}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9982353422426528, "res": {"Yes": 0.9982353422426528, "No": 0.0017645916061288097}, "ground_truth": 1}, {"key": "33460074", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9808727376482614, "res": {"Yes": 0.9808727376482614, "No": 0.01912710958987088}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994697456345629, "res": {"Yes": 0.9994697456345629, "No": 0.000530208623300902}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00011051343065535888, "res": {"No": 0.999888238005837, "Yes": 0.00011051343065535888}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 3.99238803932242e-06, "res": {"No": 0.9999950382530095, "Yes": 3.99238803932242e-06}, "ground_truth": 1}, {"key": "36191495", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.6321260090194233e-05, "res": {"No": 0.999974535534225, "Yes": 1.6321260090194233e-05}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00010390505588236788, "res": {"No": 0.9998949126820591, "Yes": 0.00010390505588236788}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0006534817185278626, "res": {"No": 0.9993463932939827, "Yes": 0.0006534817185278626}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.3413345150487165, "res": {"No": 0.6586652896216557, "Yes": 0.3413345150487165}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.588847524888805, "res": {"Yes": 0.588847524888805, "No": 0.411152412456523}, "ground_truth": 1}, {"key": "39532668", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991277481330144, "res": {"Yes": 0.9991277481330144, "No": 0.0008718756913575172}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999961110815618, "res": {"Yes": 0.9999961110815618, "No": 3.567947705086793e-06}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999375840279578, "res": {"Yes": 0.9999375840279578, "No": 6.199371803926111e-05}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999979422771714, "res": {"Yes": 0.999979422771714, "No": 2.015597071629447e-05}, "ground_truth": 1}, {"key": "20328247", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.07637216359899776, "res": {"No": 0.923627816019918, "Yes": 0.07637216359899776}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9971359934144237, "res": {"Yes": 0.9971359934144237, "No": 0.0028626428712316705}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.03933990031340125, "res": {"No": 0.9606597989724236, "Yes": 0.03933990031340125}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8826854770174909, "res": {"Yes": 0.8826854770174909, "No": 0.11731385668413623}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999511724841019, "res": {"Yes": 0.9999511724841019, "No": 4.792597140323041e-05}, "ground_truth": 1}, {"key": "39112675", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998866885302296, "res": {"Yes": 0.9998866885302296, "No": 0.00011238118811913184}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.10191294607128634, "res": {"No": 0.8980865576139307, "Yes": 0.10191294607128634}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 5.5217368910430595e-05, "res": {"No": 0.9999434246564451, "Yes": 5.5217368910430595e-05}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.06037613910643826, "res": {"No": 0.9396226908598395, "Yes": 0.06037613910643826}, "ground_truth": 1}, {"key": "31620300", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.31000036626612937, "res": {"No": 0.6899995731598061, "Yes": 0.31000036626612937}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0007121472899779234, "res": {"No": 0.9992877027042486, "Yes": 0.0007121472899779234}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.06619630720479368, "res": {"No": 0.9338030035214518, "Yes": 0.06619630720479368}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9477678885574095, "res": {"Yes": 0.9477678885574095, "No": 0.05223178820477794}, "ground_truth": 1}, {"key": "37518509", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.004211620451502058, "res": {"No": 0.9957881548044545, "Yes": 0.004211620451502058}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0014742194731446469, "res": {"No": 0.9985249134112778, "Yes": 0.0014742194731446469}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 5.5343352798289316e-05, "res": {"No": 0.9999430670627412, "Yes": 5.5343352798289316e-05}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999382992035725, "res": {"Yes": 0.9999382992035725, "No": 6.142067826183217e-05}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998131655857234, "res": {"Yes": 0.9998131655857234, "No": 0.00018668739955990174}, "ground_truth": 1}, {"key": "35454095", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999972151525776, "res": {"Yes": 0.999972151525776, "No": 2.743376510857527e-05}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.624680174114361e-07}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.3456468810727035, "res": {"No": 0.6543530770754465, "Yes": 0.3456468810727035}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.5118404108955558, "res": {"Yes": 0.5118404108955558, "No": 0.48815939371238215}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8300232305240283, "res": {"Yes": 0.8300232305240283, "No": 0.1699766677297266}, "ground_truth": 1}, {"key": "38542788", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.011339267240615363, "res": {"No": 0.9886597845348626, "Yes": 0.011339267240615363}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.06913139568138439, "res": {"No": 0.9308685257415814, "Yes": 0.06913139568138439}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 5.046023755339242e-06, "res": {"No": 0.9999893165220688, "Yes": 5.046023755339242e-06}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9988867193572102, "res": {"Yes": 0.9988867193572102, "No": 0.001112854436564125}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998498667711213, "res": {"Yes": 0.9998498667711213, "No": 0.00014960254208821306}, "ground_truth": 1}, {"key": "23944937", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998315160150211, "res": {"Yes": 0.9998315160150211, "No": 0.00016761145918969803}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999973031140366, "res": {"Yes": 0.9999973031140366, "No": 2.6259337785867046e-06}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00021288701052947796, "res": {"No": 0.9997869460192236, "Yes": 0.00021288701052947796}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.059690822342950846, "res": {"No": 0.9403090887007934, "Yes": 0.059690822342950846}, "ground_truth": 1}, {"key": "31753944", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.992115419661731, "res": {"Yes": 0.992115419661731, "No": 0.007884551029584491}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 4.026577062732543e-07}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.078737596123475e-05, "res": {"No": 0.9999889589149532, "Yes": 1.078737596123475e-05}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 7.712978773994872e-05, "res": {"No": 0.9999223270267016, "Yes": 7.712978773994872e-05}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.01073054104534343, "res": {"No": 0.9892691122142706, "Yes": 0.01073054104534343}, "ground_truth": 1}, {"key": "35527214", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0059913800564136525, "res": {"No": 0.9940081705401898, "Yes": 0.0059913800564136525}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 7.508919330093896e-06, "res": {"No": 0.9999922965856715, "Yes": 7.508919330093896e-06}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0004836619720989942, "res": {"No": 0.9995161784993875, "Yes": 0.0004836619720989942}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 5.937169816514432e-06, "res": {"No": 0.9999909853566321, "Yes": 5.937169816514432e-06}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9019028137614562, "res": {"Yes": 0.9019028137614562, "No": 0.09809720540730718}, "ground_truth": 1}, {"key": "40400404", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.012442001653408898, "res": {"No": 0.9875578002707888, "Yes": 0.012442001653408898}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7199484260670865, "res": {"Yes": 0.7199484260670865, "No": 0.28005143395105025}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8094860571823469, "res": {"Yes": 0.8094860571823469, "No": 0.1905124561383444}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.14007641273784935, "res": {"No": 0.8599218293246633, "Yes": 0.14007641273784935}, "ground_truth": 1}, {"key": "21713119", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999398487531588, "res": {"Yes": 0.9999398487531588, "No": 5.9538642644977664e-05}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0003607396683798863, "res": {"No": 0.9996385012564222, "Yes": 0.0003607396683798863}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.033219497544555825, "res": {"No": 0.9667804091110299, "Yes": 0.033219497544555825}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9913432255313737, "res": {"Yes": 0.9913432255313737, "No": 0.008656639328745186}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.26373855196656065, "res": {"No": 0.7362610615151247, "Yes": 0.26373855196656065}, "ground_truth": 1}, {"key": "28730678", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.031003824845346053, "res": {"No": 0.9689961434762127, "Yes": 0.031003824845346053}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9783335959063441, "res": {"Yes": 0.9783335959063441, "No": 0.02166563314266744}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.6851651282501842e-06, "res": {"No": 0.9999974223173222, "Yes": 1.6851651282501842e-06}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 4.633310196821349e-06, "res": {"No": 0.9999931310055916, "Yes": 4.633310196821349e-06}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.08315067130119692, "res": {"No": 0.9168480168436423, "Yes": 0.08315067130119692}, "ground_truth": 1}, {"key": "36823733", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.021378896251468032, "res": {"No": 0.9786189264314128, "Yes": 0.021378896251468032}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 8.03940083950469e-06, "res": {"No": 0.9999909853566321, "Yes": 8.03940083950469e-06}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.722623114001075e-06, "res": {"No": 0.9999953958625991, "Yes": 3.722623114001075e-06}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.002540132586257632, "res": {"No": 0.9974596733047543, "Yes": 0.002540132586257632}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9738205739173521, "res": {"Yes": 0.9738205739173521, "No": 0.026178835500239573}, "ground_truth": 1}, {"key": "35988862", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0015475154029717022, "res": {"No": 0.9984513441070424, "Yes": 0.0015475154029717022}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.14828157188006902, "res": {"No": 0.851717823571951, "Yes": 0.14828157188006902}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.001612908835556751, "res": {"No": 0.9983858656184381, "Yes": 0.001612908835556751}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 5.303783665319633e-05, "res": {"No": 0.9999431862619615, "Yes": 5.303783665319633e-05}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9019228813223132, "res": {"Yes": 0.9019228813223132, "No": 0.09807694061809485}, "ground_truth": 1}, {"key": "40499665", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0029564265103159517, "res": {"No": 0.9970428460188641, "Yes": 0.0029564265103159517}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00025847695937497133, "res": {"No": 0.9997408397678161, "Yes": 0.00025847695937497133}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 4.8253798880691546e-05, "res": {"No": 0.9999515300767047, "Yes": 4.8253798880691546e-05}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5205097287184817, "res": {"Yes": 0.5205097287184817, "No": 0.47948858067979794}, "ground_truth": 1}, {"key": "32829820", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.16147644473355796, "res": {"No": 0.8385220760828807, "Yes": 0.16147644473355796}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0001697506436126685, "res": {"No": 0.9998292515191815, "Yes": 0.0001697506436126685}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.07030956708656651, "res": {"No": 0.9296901782551269, "Yes": 0.07030956708656651}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999756083404814, "res": {"Yes": 0.9999756083404814, "No": 2.357362631168324e-05}, "ground_truth": 1}, {"key": "20583553", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9971799676824955, "res": {"Yes": 0.9971799676824955, "No": 0.00281852099915082}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9991823687827167, "res": {"Yes": 0.9991823687827167, "No": 0.0008171114979636959}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.002292660145506977, "res": {"No": 0.9977064286634229, "Yes": 0.002292660145506977}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 8.008452592527673e-06, "res": {"No": 0.9999912237625114, "Yes": 8.008452592527673e-06}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.022800671310778377, "res": {"No": 0.9771989149163071, "Yes": 0.022800671310778377}, "ground_truth": 1}, {"key": "30501550", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0008765761304890718, "res": {"No": 0.9991220350069981, "Yes": 0.0008765761304890718}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.3307669963137964e-05, "res": {"No": 0.9999814491960682, "Yes": 1.3307669963137964e-05}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00015645157825199644, "res": {"No": 0.999839382170425, "Yes": 0.00015645157825199644}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.7792560784345145, "res": {"Yes": 0.7792560784345145, "No": 0.22074206186192902}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 2.5623798741116025e-05, "res": {"No": 0.9999735819309633, "Yes": 2.5623798741116025e-05}, "ground_truth": 1}, {"key": "38755897", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00010695343554969397, "res": {"No": 0.9998922904870862, "Yes": 0.00010695343554969397}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.09472668821133227, "res": {"No": 0.9052726083003263, "Yes": 0.09472668821133227}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.000451215006160062, "res": {"No": 0.9995470267933546, "Yes": 0.000451215006160062}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.027391114678099994, "res": {"No": 0.9726087155197604, "Yes": 0.027391114678099994}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.030846740210494585, "res": {"No": 0.9691529794719739, "Yes": 0.030846740210494585}, "ground_truth": 1}, {"key": "35507201", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3042166095169712, "res": {"No": 0.6957825052086398, "Yes": 0.3042166095169712}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988204686945596, "res": {"Yes": 0.9988204686945596, "No": 0.001179503136432134}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.02501659936118611, "res": {"No": 0.9749825378910564, "Yes": 0.02501659936118611}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9858039971420691, "res": {"Yes": 0.9858039971420691, "No": 0.014195722388547676}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.997338827713531, "res": {"Yes": 0.997338827713531, "No": 0.002661073409983877}, "ground_truth": 1}, {"key": "36453511", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999956774797236, "res": {"Yes": 0.999956774797236, "No": 4.303116230392287e-05}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9880029355838191, "res": {"Yes": 0.9880029355838191, "No": 0.01199689995082799}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.6881374552098365e-06, "res": {"No": 0.9999963494876631, "Yes": 2.6881374552098365e-06}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 3.327354237673189e-05, "res": {"No": 0.9999628539429318, "Yes": 3.327354237673189e-05}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 6.168325856085549e-05, "res": {"No": 0.9999380608083109, "Yes": 6.168325856085549e-05}, "ground_truth": 1}, {"key": "38066835", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.8706679469367214e-06, "res": {"No": 0.9999976607241361, "Yes": 1.8706679469367214e-06}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 4.7366420906743446e-05, "res": {"No": 0.9999477157538689, "Yes": 4.7366420906743446e-05}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0003213017002734817, "res": {"No": 0.9996786518433829, "Yes": 0.0003213017002734817}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9719993570433031, "res": {"Yes": 0.9719993570433031, "No": 0.027999545530282433}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 3.6373563887358474e-07}, "ground_truth": 1}, {"key": "39697181", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999978991308068, "res": {"Yes": 0.9999978991308068, "No": 1.8969921597368224e-06}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.15992791444313206, "res": {"No": 0.8400715686502923, "Yes": 0.15992791444313206}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.3331738662281831e-05, "res": {"No": 0.9999864556687252, "Yes": 1.3331738662281831e-05}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.059962884490014204, "res": {"No": 0.9400370214240181, "Yes": 0.059962884490014204}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9898026808416455, "res": {"Yes": 0.9898026808416455, "No": 0.010197031810611308}, "ground_truth": 1}, {"key": "21820893", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.005158172133187711, "res": {"No": 0.9948417337827944, "Yes": 0.005158172133187711}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 8.326777761252816e-06, "res": {"No": 0.9999913429644723, "Yes": 8.326777761252816e-06}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.90279016737266e-05, "res": {"No": 0.9999490269261713, "Yes": 4.90279016737266e-05}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999915813694369, "res": {"Yes": 0.9999915813694369, "No": 7.340761310058902e-06}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.023895906759622686, "res": {"No": 0.976103666044453, "Yes": 0.023895906759622686}, "ground_truth": 1}, {"key": "40519933", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3097467347791864, "res": {"No": 0.6902521178088844, "Yes": 0.3097467347791864}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9748271984994966, "res": {"Yes": 0.9748271984994966, "No": 0.025170641083908863}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.090370408931345, "res": {"No": 0.909629262799167, "Yes": 0.090370408931345}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 8.488443506587088e-07}, "ground_truth": 1}, {"key": "30446033", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 7.04877430281456e-08}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9926210438679534, "res": {"Yes": 0.9926210438679534, "No": 0.007378610036839385}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00026597506345149406, "res": {"No": 0.9997338122342516, "Yes": 0.00026597506345149406}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 1.8842326408933654e-07}, "ground_truth": 1}, {"key": "40216291", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.05933145352636305, "res": {"No": 0.9406680073410185, "Yes": 0.05933145352636305}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.02509442422379451, "res": {"No": 0.9749053642527618, "Yes": 0.02509442422379451}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.9113082714291315e-06, "res": {"No": 0.9999964686909351, "Yes": 2.9113082714291315e-06}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8610046275037792, "res": {"Yes": 0.8610046275037792, "No": 0.13899396000458325}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9183864752056086, "res": {"Yes": 0.9183864752056086, "No": 0.08161287072312469}, "ground_truth": 1}, {"key": "33479118", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6401477051239444, "res": {"Yes": 0.6401477051239444, "No": 0.3598513678026418}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.04187415785351377, "res": {"No": 0.9581257333070542, "Yes": 0.04187415785351377}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 4.4981107035883834e-05, "res": {"No": 0.9999542716355735, "Yes": 4.4981107035883834e-05}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.48763826902014307, "res": {"No": 0.5123600696908029, "Yes": 0.48763826902014307}, "ground_truth": 1}, {"key": "22297373", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999645227323332, "res": {"Yes": 0.9999645227323332, "No": 3.4802650858156036e-05}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.006674484540998118, "res": {"No": 0.993324534575427, "Yes": 0.006674484540998118}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.2966376164824385e-05, "res": {"No": 0.9999865748701179, "Yes": 1.2966376164824385e-05}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.008480869492005586, "res": {"No": 0.9915189943695342, "Yes": 0.008480869492005586}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3346162252910643, "res": {"No": 0.6653825969552558, "Yes": 0.3346162252910643}, "ground_truth": 1}, {"key": "36463668", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7662927209552999, "res": {"Yes": 0.7662927209552999, "No": 0.23370608502832171}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.029308725753740744, "res": {"No": 0.9706901690564051, "Yes": 0.029308725753740744}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00021939166517933825, "res": {"No": 0.9997787264246095, "Yes": 0.00021939166517933825}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.4956014968711208e-05, "res": {"No": 0.9999847868417213, "Yes": 1.4956014968711208e-05}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6337703209344209, "res": {"Yes": 0.6337703209344209, "No": 0.3662290945525387}, "ground_truth": 1}, {"key": "35264615", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9622054698500365, "res": {"Yes": 0.9622054698500365, "No": 0.03779435976711781}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 3.0213249639876262e-05, "res": {"No": 0.9999696483206215, "Yes": 3.0213249639876262e-05}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.1676778188013056e-05, "res": {"No": 0.99997334352929, "Yes": 2.1676778188013056e-05}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00021013066635663298, "res": {"No": 0.999789806303791, "Yes": 0.00021013066635663298}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.04007443416449198, "res": {"No": 0.9599253480421552, "Yes": 0.04007443416449198}, "ground_truth": 1}, {"key": "39898482", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.006136451104113066, "res": {"No": 0.9938627254815033, "Yes": 0.006136451104113066}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0037424436446261205, "res": {"No": 0.996257296041387, "Yes": 0.0037424436446261205}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.02909301406849434, "res": {"No": 0.970906775552244, "Yes": 0.02909301406849434}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.3447217186660168, "res": {"No": 0.655278265983839, "Yes": 0.3447217186660168}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999956342685299, "res": {"Yes": 0.9999956342685299, "No": 4.273373482086272e-06}, "ground_truth": 1}, {"key": "37228721", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999953079650794, "res": {"Yes": 0.999953079650794, "No": 4.6611465794734053e-05}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.057111441834699836, "res": {"No": 0.9428885122577361, "Yes": 0.057111441834699836}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.990761313440404e-05, "res": {"No": 0.9999284059529762, "Yes": 6.990761313440404e-05}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9917700827319319, "res": {"Yes": 0.9917700827319319, "No": 0.008229208018241771}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999367496503877, "res": {"Yes": 0.9999367496503877, "No": 6.303288396828296e-05}, "ground_truth": 1}, {"key": "24535799", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9854101810795338, "res": {"Yes": 0.9854101810795338, "No": 0.014589040249536438}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7239090978029227, "res": {"Yes": 0.7239090978029227, "No": 0.27609085021032104}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.021446771655813e-06, "res": {"No": 0.9999899125338788, "Yes": 6.021446771655813e-06}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998689366795475, "res": {"Yes": 0.9998689366795475, "No": 0.00013093219031023407}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999978707566687, "res": {"Yes": 0.999978707566687, "No": 2.1133121688058307e-05}, "ground_truth": 1}, {"key": "35177759", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.22585842817494778, "res": {"No": 0.7741411482021964, "Yes": 0.22585842817494778}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9960153979777724, "res": {"Yes": 0.9960153979777724, "No": 0.003984318490740773}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00022539255208628176, "res": {"No": 0.9997731251000034, "Yes": 0.00022539255208628176}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.04970659293746715, "res": {"No": 0.9502924354186616, "Yes": 0.04970659293746715}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0006850796151222366, "res": {"No": 0.9993144864718347, "Yes": 0.0006850796151222366}, "ground_truth": 1}, {"key": "34364829", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7538721105617195, "res": {"Yes": 0.7538721105617195, "No": 0.24612742237979385}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.44428190360313813, "res": {"No": 0.5557174485294416, "Yes": 0.44428190360313813}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.805265574306319, "res": {"Yes": 0.805265574306319, "No": 0.19473420529207128}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9735558796955895, "res": {"Yes": 0.9735558796955895, "No": 0.026442571785193377}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9985886193358373, "res": {"Yes": 0.9985886193358373, "No": 0.0014106693089807607}, "ground_truth": 1}, {"key": "38090732", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998212662747757, "res": {"Yes": 0.9998212662747757, "No": 0.00017824527620049775}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.37833898481852146, "res": {"No": 0.6216589552952934, "Yes": 0.37833898481852146}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.06661280184585103, "res": {"No": 0.9333869749292377, "Yes": 0.06661280184585103}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9936135029199348, "res": {"Yes": 0.9936135029199348, "No": 0.006385847917238405}, "ground_truth": 1}, {"key": "30651479", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992181947690878, "res": {"Yes": 0.9992181947690878, "No": 0.0007811651271993042}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997621609181999, "res": {"Yes": 0.9997621609181999, "No": 0.00023693374805040343}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.5488604660374575, "res": {"Yes": 0.5488604660374575, "No": 0.4511359696975237}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9965737865106862, "res": {"Yes": 0.9965737865106862, "No": 0.003422655387771055}, "ground_truth": 1}, {"key": "39380921", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9954718137900199, "res": {"Yes": 0.9954718137900199, "No": 0.004525822275484089}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.10219326536582544, "res": {"No": 0.8978057842157121, "Yes": 0.10219326536582544}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.866482183605459e-06, "res": {"No": 0.9999949190499081, "Yes": 2.866482183605459e-06}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9589816076100257, "res": {"Yes": 0.9589816076100257, "No": 0.04101728154446276}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998862117703717, "res": {"Yes": 0.9998862117703717, "No": 0.00011316507098645603}, "ground_truth": 1}, {"key": "39037490", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994293760977794, "res": {"Yes": 0.9994293760977794, "No": 0.0005696523474300349}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998565412111963, "res": {"Yes": 0.9998565412111963, "No": 0.00014276195002102686}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.03458238260005751, "res": {"No": 0.9654172062417267, "Yes": 0.03458238260005751}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.23304905758578284, "res": {"No": 0.7669507200038093, "Yes": 0.23304905758578284}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.03100617192372264, "res": {"No": 0.9689921192435851, "Yes": 0.03100617192372264}, "ground_truth": 1}, {"key": "35917499", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.032963051378327834, "res": {"No": 0.9670365160878382, "Yes": 0.032963051378327834}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.018207858361214753, "res": {"No": 0.9817920615489597, "Yes": 0.018207858361214753}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.995030698683801e-06, "res": {"No": 0.9999947998470209, "Yes": 4.995030698683801e-06}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9986623213907058, "res": {"Yes": 0.9986623213907058, "No": 0.0013375442441539015}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9935876106830266, "res": {"Yes": 0.9935876106830266, "No": 0.006412336922485325}, "ground_truth": 1}, {"key": "34908073", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998801678860878, "res": {"Yes": 0.998801678860878, "No": 0.0011980639500948674}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9592027809826956, "res": {"Yes": 0.9592027809826956, "No": 0.040796866581267084}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.02814965444388068, "res": {"No": 0.971849709823186, "Yes": 0.02814965444388068}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.984150638244256, "res": {"Yes": 0.984150638244256, "No": 0.015845749261837568}, "ground_truth": 1}, {"key": "36344759", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990046048347628, "res": {"Yes": 0.9990046048347628, "No": 0.000992214047763611}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0008135560775494923, "res": {"No": 0.9991860574311089, "Yes": 0.0008135560775494923}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0007004623086411962, "res": {"No": 0.9992992463026356, "Yes": 0.0007004623086411962}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.1353756416278812e-06, "res": {"No": 0.9999978991308068, "Yes": 1.1353756416278812e-06}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.982244900705156, "res": {"Yes": 0.982244900705156, "No": 0.01775336151259075}, "ground_truth": 1}, {"key": "39984637", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.992545173098119, "res": {"Yes": 0.992545173098119, "No": 0.0074542592391613465}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9950284174302231, "res": {"Yes": 0.9950284174302231, "No": 0.0049711225459542745}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0006501977568752932, "res": {"No": 0.9993480610745897, "Yes": 0.0006501977568752932}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.08104619323577768, "res": {"No": 0.9189522928480378, "Yes": 0.08104619323577768}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995479799918402, "res": {"Yes": 0.9995479799918402, "No": 0.00045034963960058653}, "ground_truth": 1}, {"key": "17917326", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9953333806625403, "res": {"Yes": 0.9953333806625403, "No": 0.004664760900073024}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.017270295091963782, "res": {"No": 0.982725638597887, "Yes": 0.017270295091963782}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.7537345767656033e-06, "res": {"No": 0.9999976607241361, "Yes": 1.7537345767656033e-06}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998986076205548, "res": {"Yes": 0.9998986076205548, "No": 0.00010119765229965612}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991673725267863, "res": {"Yes": 0.9991673725267863, "No": 0.0008324206133466745}, "ground_truth": 1}, {"key": "32193638", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999968263007362, "res": {"Yes": 0.9999968263007362, "No": 3.000987970533749e-06}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7584832223123681, "res": {"Yes": 0.7584832223123681, "No": 0.24151659304232992}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.2789844035438024, "res": {"No": 0.7210155461512726, "Yes": 0.2789844035438024}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.030309957199655832, "res": {"No": 0.9696897044313417, "Yes": 0.030309957199655832}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999856212553752, "res": {"Yes": 0.9999856212553752, "No": 1.405307956614238e-05}, "ground_truth": 1}, {"key": "34564692", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9388079375925024, "res": {"Yes": 0.9388079375925024, "No": 0.061191285095749864}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.03381373155399738, "res": {"No": 0.9661860103579801, "Yes": 0.03381373155399738}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00011022431955234243, "res": {"No": 0.999887165296314, "Yes": 0.00011022431955234243}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9969840693836133, "res": {"Yes": 0.9969840693836133, "No": 0.0030149048746416778}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999765619466755, "res": {"Yes": 0.9999765619466755, "No": 2.294946346872635e-05}, "ground_truth": 1}, {"key": "39329284", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999970647075079, "res": {"Yes": 0.9999970647075079, "No": 1.6930837290692613e-06}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.001038369068616497, "res": {"No": 0.9989570158864183, "Yes": 0.001038369068616497}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.025435798689532583, "res": {"No": 0.9745635424286984, "Yes": 0.025435798689532583}, "ground_truth": 1}, {"key": "37438541", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9782335390197183, "res": {"Yes": 0.9782335390197183, "No": 0.02176505449914671}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9710625486792839, "res": {"Yes": 0.9710625486792839, "No": 0.028936514612016594}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.0627075723741666e-05, "res": {"No": 0.9999837140256179, "Yes": 1.0627075723741666e-05}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.016783785624845518, "res": {"No": 0.983216089934496, "Yes": 0.016783785624845518}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9923211526498643, "res": {"Yes": 0.9923211526498643, "No": 0.007678416023764797}, "ground_truth": 1}, {"key": "34652757", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.38906853436298894, "res": {"No": 0.6109313395623498, "Yes": 0.38906853436298894}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999160097413793, "res": {"Yes": 0.9999160097413793, "No": 8.371067916645429e-05}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.924761992485049, "res": {"Yes": 0.924761992485049, "No": 0.07523794406117973}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9865821803717816, "res": {"Yes": 0.9865821803717816, "No": 0.013417743582342554}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.08424285672425372, "res": {"No": 0.915757063502974, "Yes": 0.08424285672425372}, "ground_truth": 1}, {"key": "31361004", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.002463878363480389, "res": {"No": 0.997536065482047, "Yes": 0.002463878363480389}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9959854842997256, "res": {"Yes": 0.9959854842997256, "No": 0.0040145420414272}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.169784352473345e-06, "res": {"No": 0.9999955150656573, "Yes": 3.169784352473345e-06}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.01329567745450717, "res": {"No": 0.9867033341823664, "Yes": 0.01329567745450717}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6537890716229829, "res": {"Yes": 0.6537890716229829, "No": 0.3462102948393619}, "ground_truth": 1}, {"key": "26150727", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9909098207766025, "res": {"Yes": 0.9909098207766025, "No": 0.009089689770800059}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9968342034352736, "res": {"Yes": 0.9968342034352736, "No": 0.0031647807471113184}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0007775823524267696, "res": {"No": 0.999222244508716, "Yes": 0.0007775823524267696}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8979189956843109, "res": {"Yes": 0.8979189956843109, "No": 0.10207991419012398}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9428712330411905, "res": {"Yes": 0.9428712330411905, "No": 0.05712848071902239}, "ground_truth": 1}, {"key": "36997402", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9926670922292042, "res": {"Yes": 0.9926670922292042, "No": 0.007332679333971624}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997560829925914, "res": {"Yes": 0.9997560829925914, "No": 0.00024337404944528235}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999813299942867, "res": {"Yes": 0.9999813299942867, "No": 1.810412038535678e-05}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, " Yes": 1.3069832918321148e-07}, "ground_truth": 1}, {"key": "37430643", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, " Yes": 1.3405669894942794e-07}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9835645857655568, "res": {"Yes": 0.9835645857655568, "No": 0.01643506034722775}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.1132730503760657, "res": {"No": 0.8867266258692824, "Yes": 0.1132730503760657}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 8.365069567975173e-07}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9981031530923066, "res": {"Yes": 0.9981031530923066, "No": 0.0018965654243766452}, "ground_truth": 1}, {"key": "36964631", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999983759447187, "res": {"Yes": 0.9999983759447187, "No": 1.4681947104809473e-06}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.999994561441089, "res": {"Yes": 0.999994561441089, "No": 4.954749234699058e-06}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 7.717600232269062e-05, "res": {"No": 0.9999225654082128, "Yes": 7.717600232269062e-05}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.014397314253053371, "res": {"No": 0.9856025893745616, "Yes": 0.014397314253053371}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.012096828115001694, "res": {"No": 0.9879031049071143, "Yes": 0.012096828115001694}, "ground_truth": 1}, {"key": "35502013", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998282980724635, "res": {"Yes": 0.9998282980724635, "No": 0.00017146901126799505}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0002777503137033965, "res": {"No": 0.9997221371310395, "Yes": 0.0002777503137033965}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.004415112340778478, "res": {"No": 0.9955845255977688, "Yes": 0.004415112340778478}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9782792803329137, "res": {"Yes": 0.9782792803329137, "No": 0.02172061867947542}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7391143306902167, "res": {"Yes": 0.7391143306902167, "No": 0.2608856735497726}, "ground_truth": 1}, {"key": "33987664", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9975162551112672, "res": {"Yes": 0.9975162551112672, "No": 0.002483002662909942}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9924778867714843, "res": {"Yes": 0.9924778867714843, "No": 0.0075215022024940565}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00251388981081348, "res": {"No": 0.9974855317845012, "Yes": 0.00251388981081348}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7087702662448437, "res": {"Yes": 0.7087702662448437, "No": 0.29122736321201725}, "ground_truth": 1}, {"key": "35203721", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0016802477940250807, "res": {"No": 0.9983183794110269, "Yes": 0.0016802477940250807}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0009579873353174044, "res": {"No": 0.9990392188460586, "Yes": 0.0009579873353174044}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0005009997278966578, "res": {"No": 0.9994989207821441, "Yes": 0.0005009997278966578}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9828837433709894, "res": {"Yes": 0.9828837433709894, "No": 0.01711608524521051}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999943230348141, "res": {"Yes": 0.9999943230348141, "No": 5.5134168997630784e-06}, "ground_truth": 1}, {"key": "39028348", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997176086499453, "res": {"Yes": 0.9997176086499453, "No": 0.00028218095737607635}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9983579459484203, "res": {"Yes": 0.9983579459484203, "No": 0.0016418603833130512}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.5421430988075773e-05, "res": {"No": 0.9999675027220479, "Yes": 2.5421430988075773e-05}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999884821053314, "res": {"Yes": 0.9999884821053314, "No": 1.1063247270897279e-05}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999404447334853, "res": {"Yes": 0.9999404447334853, "No": 5.903943190049152e-05}, "ground_truth": 1}, {"key": "37459383", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9747544752039378, "res": {"Yes": 0.9747544752039378, "No": 0.02524482486774338}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7355743693854858, "res": {"Yes": 0.7355743693854858, "No": 0.264424952871013}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.43677995161376e-05, "res": {"No": 0.9999853828508316, "Yes": 1.43677995161376e-05}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0004090508835508224, "res": {"No": 0.9995907410093171, "Yes": 0.0004090508835508224}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9940775512527021, "res": {"Yes": 0.9940775512527021, "No": 0.0059217675619325175}, "ground_truth": 1}, {"key": "34020070", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.31173166790007595, "res": {"No": 0.6882671272864261, "Yes": 0.31173166790007595}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.1297899116497018, "res": {"No": 0.8702093796714242, "Yes": 0.1297899116497018}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 9.503141849878877e-05, "res": {"No": 0.9999046864026295, "Yes": 9.503141849878877e-05}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999938462231346, "res": {"Yes": 0.9999938462231346, "No": 5.6256447174848614e-06}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999757275415809, "res": {"Yes": 0.9999757275415809, "No": 2.3636131995157824e-05}, "ground_truth": 1}, {"key": "35176615", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9650905546791574, "res": {"Yes": 0.9650905546791574, "No": 0.03490913626275926}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.016915414029284228, "res": {"No": 0.9830846240521052, "Yes": 0.016915414029284228}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0025960308410274005, "res": {"No": 0.9974038187228829, "Yes": 0.0025960308410274005}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 9.995054942844578e-05, "res": {"No": 0.9998995611443197, "Yes": 9.995054942844578e-05}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992168844951281, "res": {"Yes": 0.9992168844951281, "No": 0.0007826463690055256}, "ground_truth": 1}, {"key": "33296389", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.18354494676172295, "res": {"No": 0.8164546582147295, "Yes": 0.18354494676172295}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.022708465375110017, "res": {"No": 0.9772912450313943, "Yes": 0.022708465375110017}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 1.6981181221998636e-07}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999955150656573, "res": {"Yes": 0.9999955150656573, "No": 4.397840205230864e-06}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999980183344636, "res": {"Yes": 0.9999980183344636, "No": 1.8197034676731457e-06}, "ground_truth": 1}, {"key": "35399504", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996189700903411, "res": {"Yes": 0.9996189700903411, "No": 0.00038070091161610713}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9962453381364532, "res": {"Yes": 0.9962453381364532, "No": 0.003753450607835372}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.4223292032533986e-06, "res": {"No": 0.9999974223173222, "Yes": 2.4223292032533986e-06}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0007254884542237152, "res": {"No": 0.9992744880111876, "Yes": 0.0007254884542237152}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999413983091462, "res": {"Yes": 0.9999413983091462, "No": 5.7449859458485255e-05}, "ground_truth": 1}, {"key": "34807886", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999911045595646, "res": {"Yes": 0.9999911045595646, "No": 8.454658218722292e-06}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9876325676455474, "res": {"Yes": 0.9876325676455474, "No": 0.012366946132213476}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.6036151790046297e-06, "res": {"No": 0.9999958726752174, "Yes": 3.6036151790046297e-06}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.14776538492926983, "res": {"No": 0.8522340357719469, "Yes": 0.14776538492926983}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9952812962295313, "res": {"Yes": 0.9952812962295313, "No": 0.004718080197229805}, "ground_truth": 1}, {"key": "37629813", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9987158304522985, "res": {"Yes": 0.9987158304522985, "No": 0.0012838575785485348}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.5854462511926427, "res": {"Yes": 0.5854462511926427, "No": 0.41455326849915847}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999974223173222, "res": {"Yes": 0.9999974223173222, "No": 2.312641916836611e-06}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999882437011058, "res": {"Yes": 0.9999882437011058, "No": 1.1416407304913483e-05}, "ground_truth": 1}, {"key": "28084389", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.1758545581020012, "res": {"No": 0.8241449700670023, "Yes": 0.1758545581020012}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8041416208332078, "res": {"Yes": 0.8041416208332078, "No": 0.19585826874029483}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.088592478830137e-06, "res": {"No": 0.9999977799274644, "Yes": 1.088592478830137e-06}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 5.7340928370962865e-06, "res": {"No": 0.9999934886141991, "Yes": 5.7340928370962865e-06}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.13952869499289922, "res": {"No": 0.8604712798552263, "Yes": 0.13952869499289922}, "ground_truth": 1}, {"key": "35391734", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.04209338822141123, "res": {"No": 0.9579059184927975, "Yes": 0.04209338822141123}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.978135323433799, "res": {"Yes": 0.978135323433799, "No": 0.02186438547350968}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.3410292596344747, "res": {"No": 0.6589705265411889, "Yes": 0.3410292596344747}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00036417665213070915, "res": {"No": 0.9996357605513003, "Yes": 0.00036417665213070915}, "ground_truth": 1}, {"key": "40214591", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9041965279886459, "res": {"Yes": 0.9041965279886459, "No": 0.09580280640681511}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.10726166097979888, "res": {"No": 0.8927383072902141, "Yes": 0.10726166097979888}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0314284639960007, "res": {"No": 0.9685714431997718, "Yes": 0.0314284639960007}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998850198707218, "res": {"Yes": 0.9998850198707218, "No": 0.00011478933259989384}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 1.1551967213182022e-07}, "ground_truth": 1}, {"key": "26283171", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 5.534563221589832e-07}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998349723485612, "res": {"Yes": 0.9998349723485612, "No": 0.00016479743581252008}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.6285457256364999, "res": {"Yes": 0.6285457256364999, "No": 0.37145325517336947}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9949361272526288, "res": {"Yes": 0.9949361272526288, "No": 0.00506367385922909}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.17349702963519822, "res": {"No": 0.8265027454070143, "Yes": 0.17349702963519822}, "ground_truth": 1}, {"key": "37084030", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996120625871847, "res": {"Yes": 0.9996120625871847, "No": 0.0003874595894109766}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.09876575930845341, "res": {"No": 0.9012337149047923, "Yes": 0.09876575930845341}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00012798967005456572, "res": {"No": 0.9998716780239691, "Yes": 0.00012798967005456572}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.12986882193640936, "res": {"No": 0.8701307685069845, "Yes": 0.12986882193640936}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.028736620326771857, "res": {"No": 0.9712620050158395, "Yes": 0.028736620326771857}, "ground_truth": 1}, {"key": "39027295", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.05258033965109256, "res": {"No": 0.9474190358186187, "Yes": 0.05258033965109256}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.046272284686849546, "res": {"No": 0.9537258831944023, "Yes": 0.046272284686849546}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00011617533493222164, "res": {"No": 0.9998818017459641, "Yes": 0.00011617533493222164}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999964686909351, "res": {"Yes": 0.9999964686909351, "No": 2.81720866029784e-06}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, " Yes": 3.90130905115368e-07}, "ground_truth": 1}, {"key": "14018647", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986147708168867, "res": {"Yes": 0.9986147708168867, "No": 0.001383874645430018}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999968263007362, "res": {"Yes": 0.9999968263007362, "No": 2.2216708722894507e-06}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.005101136096706436, "res": {"No": 0.9948950710655198, "Yes": 0.005101136096706436}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.565802488807494e-05, "res": {"No": 0.999983356420506, "Yes": 1.565802488807494e-05}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0003334475421110819, "res": {"No": 0.9996661395438096, "Yes": 0.0003334475421110819}, "ground_truth": 1}, {"key": "37424289", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0009542937689576824, "res": {"No": 0.9990444514275743, "Yes": 0.0009542937689576824}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0004183606493279424, "res": {"No": 0.9995810931659792, "Yes": 0.0004183606493279424}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.4977761853746728e-05, "res": {"No": 0.999984906043415, "Yes": 1.4977761853746728e-05}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9877744512544359, "res": {"Yes": 0.9877744512544359, "No": 0.012224529879808805}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.994240614219246, "res": {"Yes": 0.994240614219246, "No": 0.005758434093511468}, "ground_truth": 1}, {"key": "37498031", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999988005296937, "res": {"Yes": 0.999988005296937, "No": 1.1799610919028053e-05}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995743013953742, "res": {"Yes": 0.9995743013953742, "No": 0.00042542937709559646}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00028743638263606836, "res": {"No": 0.9997117693464384, "Yes": 0.00028743638263606836}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999304322739465, "res": {"Yes": 0.9999304322739465, "No": 6.917323829368296e-05}, "ground_truth": 1}, {"key": "30104095", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999566555993957, "res": {"Yes": 0.9999566555993957, "No": 4.317175914413457e-05}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8370980004351175, "res": {"Yes": 0.8370980004351175, "No": 0.1629015578810963}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.0236488603176787e-06, "res": {"No": 0.9999982567412194, "Yes": 1.0236488603176787e-06}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9576420651685527, "res": {"Yes": 0.9576420651685527, "No": 0.04235785063395649}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.29890122838953614, "res": {"No": 0.7010985618835717, "Yes": 0.29890122838953614}, "ground_truth": 1}, {"key": "37911407", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.002688263050661853, "res": {"No": 0.9973116836117818, "Yes": 0.002688263050661853}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993865175173773, "res": {"Yes": 0.9993865175173773, "No": 0.0006134314720820317}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.27898359449020527, "res": {"No": 0.7210162094858802, "Yes": 0.27898359449020527}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8211275108148195, "res": {"Yes": 0.8211275108148195, "No": 0.1788723600222319}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994190187350116, "res": {"Yes": 0.9994190187350116, "No": 0.0005805604661866119}, "ground_truth": 1}, {"key": "39177472", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9967206099843837, "res": {"Yes": 0.9967206099843837, "No": 0.0032790799466658432}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9978131149251281, "res": {"Yes": 0.9978131149251281, "No": 0.0021867081365246543}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.329664371277201e-06, "res": {"No": 0.9999983759447187, "Yes": 1.329664371277201e-06}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.2129875000938805, "res": {"No": 0.7870124902335588, "Yes": 0.2129875000938805}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997236863416524, "res": {"Yes": 0.9997236863416524, "No": 0.00027620671643404575}, "ground_truth": 1}, {"key": "32325454", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9891364769361642, "res": {"Yes": 0.9891364769361642, "No": 0.010863403671480148}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9838885141270821, "res": {"Yes": 0.9838885141270821, "No": 0.016111483505990218}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.053432628447305675, "res": {"No": 0.9465669817574222, "Yes": 0.053432628447305675}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999963211539712, "res": {"Yes": 0.999963211539712, "No": 3.6566135698797185e-05}, "ground_truth": 1}, {"key": "38395319", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999958726752174, "res": {"Yes": 0.9999958726752174, "No": 3.852766870963059e-06}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 9.860636733389334e-08}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.007674117314542409, "res": {"No": 0.9923254893012416, "Yes": 0.007674117314542409}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9571731920251558, "res": {"Yes": 0.9571731920251558, "No": 0.042825695259752584}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.98277296780432, "res": {"Yes": 0.98277296780432, "No": 0.01722648248316148}, "ground_truth": 1}, {"key": "38235895", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999177976487984, "res": {"Yes": 0.9999177976487984, "No": 8.175316772565139e-05}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9853180485495017, "res": {"Yes": 0.9853180485495017, "No": 0.014681345568745514}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00010691568764984118, "res": {"No": 0.9998888339594022, "Yes": 0.00010691568764984118}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.01574401477846267, "res": {"No": 0.984255608428276, "Yes": 0.01574401477846267}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9926287985516252, "res": {"Yes": 0.9926287985516252, "No": 0.007370957224552535}, "ground_truth": 1}, {"key": "26543267", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999886013079656, "res": {"Yes": 0.9999886013079656, "No": 1.102211333433329e-05}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9977091567956112, "res": {"Yes": 0.9977091567956112, "No": 0.002290580500206709}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.257055982196767e-05, "res": {"No": 0.999979303571174, "Yes": 1.257055982196767e-05}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.20359839040701713, "res": {"No": 0.7964003239692911, "Yes": 0.20359839040701713}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9669671810883224, "res": {"Yes": 0.9669671810883224, "No": 0.033030794036852974}, "ground_truth": 1}, {"key": "39054728", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9952719671035521, "res": {"Yes": 0.9952719671035521, "No": 0.004726709426868763}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00011772184051938239, "res": {"No": 0.9998815633641722, "Yes": 0.00011772184051938239}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00031362172366382834, "res": {"No": 0.9996861555994607, "Yes": 0.00031362172366382834}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 9.554932926734738e-06, "res": {"No": 0.9999902701413353, "Yes": 9.554932926734738e-06}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0038139075947795226, "res": {"No": 0.9961852421464444, "Yes": 0.0038139075947795226}, "ground_truth": 1}, {"key": "39158443", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7112684170199003, "res": {"Yes": 0.7112684170199003, "No": 0.28873109244501316}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 3.630333647498165e-06, "res": {"No": 0.9999957534720165, "Yes": 3.630333647498165e-06}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.5067084652544005, "res": {"Yes": 0.5067084652544005, "No": 0.4932910766499565}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 2.5411980700815083e-07}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999812107925193, "res": {"Yes": 0.9999812107925193, "No": 1.8616179309510635e-05}, "ground_truth": 1}, {"key": "36254201", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999957534720165, "res": {"Yes": 0.9999957534720165, "No": 3.8872406364364645e-06}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995166550788102, "res": {"Yes": 0.9995166550788102, "No": 0.0004828916290419945}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999869324773808, "res": {"Yes": 0.9999869324773808, "No": 1.2622772929338541e-05}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998337805059911, "res": {"Yes": 0.9998337805059911, "No": 0.0001660600646190051}, "ground_truth": 1}, {"key": "23434347", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 2.867614934389974e-07}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, " Yes": 1.3717477421032414e-07}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 8.918248385445633e-06, "res": {"No": 0.9999905085465441, "Yes": 8.918248385445633e-06}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.17288194781250538, "res": {"No": 0.8271177847305304, "Yes": 0.17288194781250538}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.011120589266188391, "res": {"No": 0.9888792612105688, "Yes": 0.011120589266188391}, "ground_truth": 1}, {"key": "34397620", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999928763541437, "res": {"Yes": 0.999928763541437, "No": 7.054251360763379e-05}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.021967587663554666, "res": {"No": 0.9780323507675243, "Yes": 0.021967587663554666}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.470572864249722e-06, "res": {"No": 0.9999932502087799, "Yes": 4.470572864249722e-06}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.02313260927451208, "res": {"No": 0.9768666211899315, "Yes": 0.02313260927451208}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992971094833558, "res": {"Yes": 0.9992971094833558, "No": 0.0007023631359553027}, "ground_truth": 1}, {"key": "34340916", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998837087823479, "res": {"Yes": 0.9998837087823479, "No": 0.00011598693529129096}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.014098202105166784, "res": {"No": 0.9859016803705173, "Yes": 0.014098202105166784}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.006019663007794229, "res": {"No": 0.9939801380164521, "Yes": 0.006019663007794229}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1478475653273241, "res": {"No": 0.8521519695858524, "Yes": 0.1478475653273241}, "ground_truth": 1}, {"key": "30375089", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.13088349534466676, "res": {"No": 0.8691162658269153, "Yes": 0.13088349534466676}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9903459355910081, "res": {"Yes": 0.9903459355910081, "No": 0.009652952035478618}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.016978847064863616, "res": {"No": 0.9830211463612237, "Yes": 0.016978847064863616}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.17170910224347177, "res": {"No": 0.8282908898914294, "Yes": 0.17170910224347177}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9895784921721862, "res": {"Yes": 0.9895784921721862, "No": 0.010421367638229342}, "ground_truth": 1}, {"key": "35807797", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.26272949821378444, "res": {"No": 0.7372704156838245, "Yes": 0.26272949821378444}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.05485734448218393, "res": {"No": 0.9451424567179756, "Yes": 0.05485734448218393}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0005351189496429442, "res": {"No": 0.9994646262636898, "Yes": 0.0005351189496429442}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.010401242591708522, "res": {"No": 0.9895984492028739, "Yes": 0.010401242591708522}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.13302485347300386, "res": {"No": 0.8669744691346988, "Yes": 0.13302485347300386}, "ground_truth": 1}, {"key": "34188172", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.2627028325230224, "res": {"No": 0.7372969136587298, "Yes": 0.2627028325230224}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.057549110503383946, "res": {"No": 0.9424508118881062, "Yes": 0.057549110503383946}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.1062916407242876e-06, "res": {"No": 0.9999981375378344, "Yes": 1.1062916407242876e-06}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 9.044805825028817e-07, "res": {"No": 0.9999984951481323, "Yes": 9.044805825028817e-07}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 4.3243794527566633e-07, "res": {"No": 0.9999988527586581, "Yes": 4.3243794527566633e-07}, "ground_truth": 1}, {"key": "37075567", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00039983643779238024, "res": {"No": 0.9995997968026719, "Yes": 0.00039983643779238024}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.1327842700562924e-06, "res": {"No": 0.9999982567412194, "Yes": 1.1327842700562924e-06}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.3162166104866014e-06, "res": {"No": 0.9999958726752174, "Yes": 3.3162166104866014e-06}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8318045929405528, "res": {"Yes": 0.8318045929405528, "No": 0.1681951611983643}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9976993111509193, "res": {"Yes": 0.9976993111509193, "No": 0.002300208058318101}, "ground_truth": 1}, {"key": "35559735", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.61011915794371, "res": {"Yes": 0.61011915794371, "No": 0.38988014796460635}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.30819345269837006, "res": {"No": 0.6918064493210815, "Yes": 0.30819345269837006}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.5536643734045417, "res": {"Yes": 0.5536643734045417, "No": 0.44633520434832175}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8030071989556758, "res": {"Yes": 0.8030071989556758, "No": 0.19699268163403583}, "ground_truth": 1}, {"key": "33005019", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6784401383871869, "res": {"Yes": 0.6784401383871869, "No": 0.32155862614503045}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9838159323970483, "res": {"Yes": 0.9838159323970483, "No": 0.01618377632437026}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 9.652649767556271e-05, "res": {"No": 0.9999024217570665, "Yes": 9.652649767556271e-05}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9569814511551897, "res": {"Yes": 0.9569814511551897, "No": 0.043017842822318776}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997906405487492, "res": {"Yes": 0.9997906405487492, "No": 0.00020911755500173168}, "ground_truth": 1}, {"key": "30808252", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.12522073738079895, "res": {"No": 0.8747791451736365, "Yes": 0.12522073738079895}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.591138464809298, "res": {"Yes": 0.591138464809298, "No": 0.4088609321304246}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.960758616082612e-05, "res": {"No": 0.9999303130782463, "Yes": 6.960758616082612e-05}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 6.801532571637694e-05, "res": {"No": 0.9999315050358871, "Yes": 6.801532571637694e-05}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9772477487206346, "res": {"Yes": 0.9772477487206346, "No": 0.02275193687150803}, "ground_truth": 1}, {"key": "15159017", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7433099582432924, "res": {"Yes": 0.7433099582432924, "No": 0.2566900379499737}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0595881231962193, "res": {"No": 0.940411757251672, "Yes": 0.0595881231962193}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0012114074663868806, "res": {"No": 0.9987883588306274, "Yes": 0.0012114074663868806}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9440597597692463, "res": {"Yes": 0.9440597597692463, "No": 0.055939854064383975}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999932502087799, "res": {"Yes": 0.9999932502087799, "No": 6.001404696822752e-06}, "ground_truth": 1}, {"key": "24493400", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9957108520820173, "res": {"Yes": 0.9957108520820173, "No": 0.004288445354281852}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999336505512221, "res": {"Yes": 0.9999336505512221, "No": 6.55397977893308e-05}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.03976098992474717, "res": {"No": 0.9602386275924102, "Yes": 0.03976098992474717}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.994654176344343, "res": {"Yes": 0.994654176344343, "No": 0.005345444372400996}, "ground_truth": 1}, {"key": "37791071", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9984536055020526, "res": {"Yes": 0.9984536055020526, "No": 0.0015461968628838313}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996619724641854, "res": {"Yes": 0.9996619724641854, "No": 0.0003377589778939401}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00010951336076854359, "res": {"No": 0.9998900258575993, "Yes": 0.00010951336076854359}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.044062808368504236, "res": {"No": 0.955936967195874, "Yes": 0.044062808368504236}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9214246353222967, "res": {"Yes": 0.9214246353222967, "No": 0.07857492899168718}, "ground_truth": 1}, {"key": "33528627", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.018712820533581195, "res": {"No": 0.9812867395566919, "Yes": 0.018712820533581195}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.16321915043248764, "res": {"No": 0.8367805075329261, "Yes": 0.16321915043248764}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9873258057574468, "res": {"Yes": 0.9873258057574468, "No": 0.012674160049306762}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.808553516357786, "res": {"Yes": 0.808553516357786, "No": 0.19144630525336614}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9985808929860035, "res": {"Yes": 0.9985808929860035, "No": 0.0014190456652959738}, "ground_truth": 1}, {"key": "39925662", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994736772164553, "res": {"Yes": 0.9994736772164553, "No": 0.0005262891928586291}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9831199950900975, "res": {"Yes": 0.9831199950900975, "No": 0.016879996452066195}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.306949691007469e-07, "res": {"No": 0.9999984951481323, "Yes": 6.306949691007469e-07}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 5.7202268572876475e-05, "res": {"No": 0.9999425902750013, "Yes": 5.7202268572876475e-05}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.056465079153059684, "res": {"No": 0.9435336214417601, "Yes": 0.056465079153059684}, "ground_truth": 1}, {"key": "29213416", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8484415609877527, "res": {"Yes": 0.8484415609877527, "No": 0.15155708898953427}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.1523043130571101, "res": {"No": 0.8476951167261301, "Yes": 0.1523043130571101}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.3733904518347252e-05, "res": {"No": 0.9999857404566682, "Yes": 1.3733904518347252e-05}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9849517783483054, "res": {"Yes": 0.9849517783483054, "No": 0.015047611570739607}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 5.783197040473425e-07}, "ground_truth": 1}, {"key": "34492745", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9819852677808825, "res": {"Yes": 0.9819852677808825, "No": 0.018014253019586136}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.028449622141268015, "res": {"No": 0.9715500774180632, "Yes": 0.028449622141268015}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.691231790050502, "res": {"Yes": 0.691231790050502, "No": 0.30876790525275166}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9645562287447201, "res": {"Yes": 0.9645562287447201, "No": 0.03544357796361238}, "ground_truth": 1}, {"key": "34191937", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999798995780161, "res": {"Yes": 0.9999798995780161, "No": 1.9886846990744646e-05}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995242804304538, "res": {"Yes": 0.9995242804304538, "No": 0.0004755411211059014}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.001351902120583776, "res": {"No": 0.9986472285213612, "Yes": 0.001351902120583776}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.27187390628691677, "res": {"No": 0.7281220163159279, "Yes": 0.27187390628691677}, "ground_truth": 1}, {"key": "34933372", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3682980095394892, "res": {"No": 0.6317012198628235, "Yes": 0.3682980095394892}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.35418323031394666, "res": {"No": 0.6458161068777692, "Yes": 0.35418323031394666}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 6.749089169747143e-06, "res": {"No": 0.9999862172649827, "Yes": 6.749089169747143e-06}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00039168457409722657, "res": {"No": 0.9996082495542522, "Yes": 0.00039168457409722657}, "ground_truth": 1}, {"key": "38714379", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 7.550603984167674e-06, "res": {"No": 0.9999911045595646, "Yes": 7.550603984167674e-06}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.2686070214065402e-05, "res": {"No": 0.9999764427474764, "Yes": 1.2686070214065402e-05}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0024144614954320852, "res": {"No": 0.997584932978213, "Yes": 0.0024144614954320852}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.2982386549387397e-05, "res": {"No": 0.9999864556687252, "Yes": 1.2982386549387397e-05}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0014721946976452085, "res": {"No": 0.9985276474760862, "Yes": 0.0014721946976452085}, "ground_truth": 1}, {"key": "39220660", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0066770166531692375, "res": {"No": 0.9933225360084741, "Yes": 0.0066770166531692375}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0004526510673693429, "res": {"No": 0.9995469076073742, "Yes": 0.0004526510673693429}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 5.435820950216162e-06, "res": {"No": 0.9999899125338788, "Yes": 5.435820950216162e-06}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0027551317923715595, "res": {"No": 0.997242797783413, "Yes": 0.0027551317923715595}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00507984261078825, "res": {"No": 0.9949200786643572, "Yes": 0.00507984261078825}, "ground_truth": 1}, {"key": "41028780", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9680753924267894, "res": {"Yes": 0.9680753924267894, "No": 0.0319243256573754}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9962232225324181, "res": {"Yes": 0.9962232225324181, "No": 0.00377682337367609}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9955924439112234, "res": {"Yes": 0.9955924439112234, "No": 0.004407372376921341}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9975154228838028, "res": {"Yes": 0.9975154228838028, "No": 0.0024835921977171306}, "ground_truth": 1}, {"key": "39457108", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.937086429814802, "res": {"Yes": 0.937086429814802, "No": 0.06291105346194681}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.009575517484473538, "res": {"No": 0.9904241680869823, "Yes": 0.009575517484473538}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 7.219831090505689e-06, "res": {"No": 0.9999917005724405, "Yes": 7.219831090505689e-06}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9886967264978757, "res": {"Yes": 0.9886967264978757, "No": 0.011302763789814556}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5562769484630741, "res": {"Yes": 0.5562769484630741, "No": 0.443722638416518}, "ground_truth": 1}, {"key": "38288018", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.1090379600544766, "res": {"No": 0.890961314966422, "Yes": 0.1090379600544766}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.008260435242837495, "res": {"No": 0.9917393740385246, "Yes": 0.008260435242837495}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0022150291838916145, "res": {"No": 0.9977844006715977, "Yes": 0.0022150291838916145}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9970481799132448, "res": {"Yes": 0.9970481799132448, "No": 0.0029508766006760704}, "ground_truth": 1}, {"key": "40106293", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0007802072253811751, "res": {"No": 0.9992197431588021, "Yes": 0.0007802072253811751}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.003039474622638063, "res": {"No": 0.9969600101552591, "Yes": 0.003039474622638063}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.06497115349344722, "res": {"No": 0.9350285082979782, "Yes": 0.06497115349344722}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.16722977734830433, "res": {"No": 0.8327699545182501, "Yes": 0.16722977734830433}, "ground_truth": 1}, {"key": "39948797", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.008934514220568554, "res": {"No": 0.991065289876926, "Yes": 0.008934514220568554}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8061944923015251, "res": {"Yes": 0.8061944923015251, "No": 0.19380505427794262}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0012002300886816673, "res": {"No": 0.9987994203730752, "Yes": 0.0012002300886816673}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998695326316075, "res": {"Yes": 0.9998695326316075, "No": 0.00013022979683936095}, "ground_truth": 1}, {"key": "31853399", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9922781736707105, "res": {"Yes": 0.9922781736707105, "No": 0.00772036219187493}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8818473769108847, "res": {"Yes": 0.8818473769108847, "No": 0.11815236011108231}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.007088924801061368, "res": {"No": 0.9929080837705434, "Yes": 0.007088924801061368}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.4178239531019783, "res": {"No": 0.5821660690166296, "Yes": 0.4178239531019783}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995038056851366, "res": {"Yes": 0.9995038056851366, "No": 0.0004891490545037217}, "ground_truth": 1}, {"key": "35273252", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9344187880838827, "res": {"Yes": 0.9344187880838827, "No": 0.06557771835184661}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0013082341869009861, "res": {"No": 0.9986837238523855, "Yes": 0.0013082341869009861}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.000196841149936044, "res": {"No": 0.999793858390102, "Yes": 0.000196841149936044}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.011003934371457288, "res": {"No": 0.988994445158071, "Yes": 0.011003934371457288}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999920581810364, "res": {"Yes": 0.9999920581810364, "No": 5.279316074398162e-06}, "ground_truth": 1}, {"key": "37130459", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999958085982417, "res": {"Yes": 0.999958085982417, "No": 3.7801378036922295e-05}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999968263007362, "res": {"Yes": 0.9999968263007362, "No": 1.948204263853801e-06}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00020233880765163574, "res": {"No": 0.9997965995086854, "Yes": 0.00020233880765163574}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.702389770785334, "res": {"Yes": 0.702389770785334, "No": 0.2976091293245293}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4152817389733435, "res": {"No": 0.5847169470737537, "Yes": 0.4152817389733435}, "ground_truth": 1}, {"key": "21734003", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9963358769420126, "res": {"Yes": 0.9963358769420126, "No": 0.003663647658014063}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.33288922566650525, "res": {"No": 0.6671096658598192, "Yes": 0.33288922566650525}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 7.86832703583728e-05, "res": {"No": 0.9999212542766073, "Yes": 7.86832703583728e-05}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 2.174403697690992e-05, "res": {"No": 0.9999779923581718, "Yes": 2.174403697690992e-05}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9985656785237074, "res": {"Yes": 0.9985656785237074, "No": 0.001433482615536072}, "ground_truth": 1}, {"key": "33990737", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00023346882536096942, "res": {"No": 0.999766332054608, "Yes": 0.00023346882536096942}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00010423589564619936, "res": {"No": 0.9998953894470656, "Yes": 0.00010423589564619936}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9425727974207652, "res": {"Yes": 0.9425727974207652, "No": 0.05742431839266575}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.21079792622618776, "res": {"No": 0.7892015269722149, "Yes": 0.21079792622618776}, "ground_truth": 1}, {"key": "34559912", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0004261371564569785, "res": {"No": 0.9995734673409293, "Yes": 0.0004261371564569785}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 2.122930541351131e-05, "res": {"No": 0.9999773963544663, "Yes": 2.122930541351131e-05}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.324046086247535e-06, "res": {"No": 0.9999953958625991, "Yes": 4.324046086247535e-06}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0005186281528923765, "res": {"No": 0.9994812986121021, "Yes": 0.0005186281528923765}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.698011235251818, "res": {"Yes": 0.698011235251818, "No": 0.3019877878523162}, "ground_truth": 1}, {"key": "39820439", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9719642286493316, "res": {"Yes": 0.9719642286493316, "No": 0.028035248094209004}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.08294824665010539, "res": {"No": 0.917051277071051, "Yes": 0.08294824665010539}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0001275558818967827, "res": {"No": 0.9998714396345921, "Yes": 0.0001275558818967827}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.002205557428481392, "res": {"No": 0.9977943659932846, "Yes": 0.002205557428481392}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.010761245264966132, "res": {"No": 0.9892386639688514, "Yes": 0.010761245264966132}, "ground_truth": 1}, {"key": "34759328", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.006703586481892884, "res": {"No": 0.9932963061832474, "Yes": 0.006703586481892884}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 3.8750693443614435e-06, "res": {"No": 0.9999946806438478, "Yes": 3.8750693443614435e-06}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0008435258587140151, "res": {"No": 0.9991561840730588, "Yes": 0.0008435258587140151}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.001292564176262548, "res": {"No": 0.9987071470553884, "Yes": 0.001292564176262548}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9836852175233434, "res": {"Yes": 0.9836852175233434, "No": 0.016313204615698542}, "ground_truth": 1}, {"key": "36939137", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.13295587137356152, "res": {"No": 0.8670440119458452, "Yes": 0.13295587137356152}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.004219989242956104, "res": {"No": 0.9957777494700745, "Yes": 0.004219989242956104}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.001036246322888704, "res": {"No": 0.9989627280388621, "Yes": 0.001036246322888704}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.11725585932303531, "res": {"No": 0.8827438986063677, "Yes": 0.11725585932303531}, "ground_truth": 1}, {"key": "35851522", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999628539429318, "res": {"Yes": 0.9999628539429318, "No": 3.700550028562755e-05}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9143754144019287, "res": {"Yes": 0.9143754144019287, "No": 0.08562408231039612}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.9179587414039974e-05, "res": {"No": 0.9999804955832136, "Yes": 1.9179587414039974e-05}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.288130579661272, "res": {"No": 0.7118688813045498, "Yes": 0.288130579661272}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999478349506435, "res": {"Yes": 0.9999478349506435, "No": 5.184088159440212e-05}, "ground_truth": 1}, {"key": "22412782", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999982567412194, "res": {"Yes": 0.9999982567412194, "No": 1.0610431818094132e-06}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9987901409702861, "res": {"Yes": 0.9987901409702861, "No": 0.0012089815113268934}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 5.548766500854072e-07, "res": {"No": 0.9999984951481323, "Yes": 5.548766500854072e-07}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.0516296041099179e-05, "res": {"No": 0.9999891973193493, "Yes": 1.0516296041099179e-05}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9557266622133556, "res": {"Yes": 0.9557266622133556, "No": 0.04427169700070484}, "ground_truth": 1}, {"key": "38579227", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.47217482501208474, "res": {"No": 0.527823199912907, "Yes": 0.47217482501208474}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.006553642349494756, "res": {"No": 0.9934457079903865, "Yes": 0.006553642349494756}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.699990831475767e-06, "res": {"No": 0.9999938462231346, "Yes": 4.699990831475767e-06}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.4407654832898435e-06, "res": {"No": 0.9999976607241361, "Yes": 1.4407654832898435e-06}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 6.504833168441838e-05, "res": {"No": 0.9999343657340227, "Yes": 6.504833168441838e-05}, "ground_truth": 1}, {"key": "37206995", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00031570952241339207, "res": {"No": 0.9996834147936756, "Yes": 0.00031570952241339207}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.011820042162064658, "res": {"No": 0.9881790232767974, "Yes": 0.011820042162064658}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.026069638960027487, "res": {"No": 0.9739293411418707, "Yes": 0.026069638960027487}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7782027380483532, "res": {"Yes": 0.7782027380483532, "No": 0.22179580892140735}, "ground_truth": 1}, {"key": "38700847", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5794779598333889, "res": {"Yes": 0.5794779598333889, "No": 0.4205211094486591}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9134757178156171, "res": {"Yes": 0.9134757178156171, "No": 0.0865210795944081}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0003289811841065107, "res": {"No": 0.9996700719782239, "Yes": 0.0003289811841065107}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.4212565114445066, "res": {"No": 0.5787401807687038, "Yes": 0.4212565114445066}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.18781014376659877, "res": {"No": 0.8121894201323652, "Yes": 0.18781014376659877}, "ground_truth": 1}, {"key": "20246590", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.015475889225414988, "res": {"No": 0.9845233623666533, "Yes": 0.015475889225414988}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9917951867339809, "res": {"Yes": 0.9917951867339809, "No": 0.008199896883286187}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0003690084553347348, "res": {"No": 0.9996304093354627, "Yes": 0.0003690084553347348}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3263432295807923, "res": {"No": 0.6736557602577632, "Yes": 0.3263432295807923}, "ground_truth": 1}, {"key": "39141360", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0011815533593249141, "res": {"No": 0.9988178528870594, "Yes": 0.0011815533593249141}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.040773582297267116, "res": {"No": 0.959226253921151, "Yes": 0.040773582297267116}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0012526499645461547, "res": {"No": 0.9987467438822084, "Yes": 0.0012526499645461547}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5181924710513035, "res": {"Yes": 0.5181924710513035, "No": 0.481806821758792}, "ground_truth": 1}, {"key": "37906226", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.08539258573908658, "res": {"No": 0.9146067934528636, "Yes": 0.08539258573908658}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 3.229074181295803e-05, "res": {"No": 0.9999667875255465, "Yes": 3.229074181295803e-05}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0017149718714253395, "res": {"No": 0.9982848832965631, "Yes": 0.0017149718714253395}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999887205106139, "res": {"Yes": 0.9999887205106139, "No": 1.1084220917001436e-05}, "ground_truth": 1}, {"key": "16201033", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999924157887603, "res": {"Yes": 0.9999924157887603, "No": 7.0279886683390015e-06}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998981308540138, "res": {"Yes": 0.9998981308540138, "No": 0.00010169372071818196}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 8.003208773617737e-06, "res": {"No": 0.9999907469518097, "Yes": 8.003208773617737e-06}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00018524208884317036, "res": {"No": 0.9998145957494927, "Yes": 0.00018524208884317036}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9351608840433259, "res": {"Yes": 0.9351608840433259, "No": 0.06483897437642627}, "ground_truth": 1}, {"key": "36469022", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.007922983813319864, "res": {"No": 0.9920764620383308, "Yes": 0.007922983813319864}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.010452286716128537, "res": {"No": 0.9895469726200367, "Yes": 0.010452286716128537}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 5.077660164606042e-06, "res": {"No": 0.9999940846288958, "Yes": 5.077660164606042e-06}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.07252081897990911, "res": {"No": 0.9274780041350797, "Yes": 0.07252081897990911}, "ground_truth": 1}, {"key": "31295270", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.26354783248961994, "res": {"No": 0.7364503932987125, "Yes": 0.26354783248961994}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.10545920324003495, "res": {"No": 0.8945396862971987, "Yes": 0.10545920324003495}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.005718279531731382, "res": {"No": 0.9942811522239712, "Yes": 0.005718279531731382}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999011106398752, "res": {"Yes": 0.9999011106398752, "No": 9.870736443223396e-05}, "ground_truth": 1}, {"key": "35360689", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.996820582088, "res": {"Yes": 0.996820582088, "No": 0.003178865203890883}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.35523295267378713, "res": {"No": 0.6447669276309952, "Yes": 0.35523295267378713}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.8420465146754434e-05, "res": {"No": 0.9999515300767047, "Yes": 4.8420465146754434e-05}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.08883167430143157, "res": {"No": 0.9111678596718075, "Yes": 0.08883167430143157}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.03571043628515423, "res": {"No": 0.9642890084561132, "Yes": 0.03571043628515423}, "ground_truth": 1}, {"key": "29202793", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.07806138301919949, "res": {"No": 0.9219381685357244, "Yes": 0.07806138301919949}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.15448524327332303, "res": {"No": 0.8455124971264385, "Yes": 0.15448524327332303}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.9877824746448482e-05, "res": {"No": 0.9999614235510903, "Yes": 2.9877824746448482e-05}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999515300767047, "res": {"Yes": 0.9999515300767047, "No": 4.803981075892243e-05}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999970647075079, "res": {"Yes": 0.9999970647075079, "No": 2.626369719776068e-06}, "ground_truth": 1}, {"key": "35999008", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8041508765565303, "res": {"Yes": 0.8041508765565303, "No": 0.19584859358079748}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.6483631778393988, "res": {"Yes": 0.6483631778393988, "No": 0.3516359399877029}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 9.747848148801174e-06, "res": {"No": 0.9999881244990143, "Yes": 9.747848148801174e-06}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991005003925306, "res": {"Yes": 0.9991005003925306, "No": 0.0008993214710832039}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998931248215588, "res": {"Yes": 0.9998931248215588, "No": 0.0001066975885706053}, "ground_truth": 1}, {"key": "31797119", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999722971309536, "res": {"Yes": 0.999722971309536, "No": 0.00027687649988158714}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984126070431021, "res": {"Yes": 0.9984126070431021, "No": 0.0015872608249449562}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.799513705823882e-05, "res": {"No": 0.9999812107925193, "Yes": 1.799513705823882e-05}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.007231831177383353, "res": {"No": 0.9927660101793356, "Yes": 0.007231831177383353}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0010571334780304946, "res": {"No": 0.9989397677438011, "Yes": 0.0010571334780304946}, "ground_truth": 1}, {"key": "26711893", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.017623631124412835, "res": {"No": 0.9823752188690464, "Yes": 0.017623631124412835}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 5.72216634291651e-05, "res": {"No": 0.9999423518847165, "Yes": 5.72216634291651e-05}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.3218743908727828, "res": {"No": 0.6781252320905674, "Yes": 0.3218743908727828}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 5.561687953558836e-07}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.99999861435166, "res": {"Yes": 0.99999861435166, "No": 1.0230522469618063e-06}, "ground_truth": 1}, {"key": "35348288", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6598759870670738, "res": {"Yes": 0.6598759870670738, "No": 0.3401237013639811}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8527752397980218, "res": {"Yes": 0.8527752397980218, "No": 0.1472243448725126}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.129942419930189e-05, "res": {"No": 0.9999584435804919, "Yes": 4.129942419930189e-05}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9958128616108624, "res": {"Yes": 0.9958128616108624, "No": 0.004186448156043799}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9925261412268934, "res": {"Yes": 0.9925261412268934, "No": 0.0074709381402899835}, "ground_truth": 1}, {"key": "38124131", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9903861652503367, "res": {"Yes": 0.9903861652503367, "No": 0.009613178129564233}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9970089503288123, "res": {"Yes": 0.9970089503288123, "No": 0.002989925823742932}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.36282837963435e-06, "res": {"No": 0.999994561441089, "Yes": 4.36282837963435e-06}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 9.676153580843231e-05, "res": {"No": 0.9999028985246534, "Yes": 9.676153580843231e-05}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1155740995711471, "res": {"No": 0.8844256745036428, "Yes": 0.1155740995711471}, "ground_truth": 1}, {"key": "20285901", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.01552806883756895, "res": {"No": 0.9844718337623823, "Yes": 0.01552806883756895}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.0017955603357995e-06, "res": {"No": 0.9999976607241361, "Yes": 2.0017955603357995e-06}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.020940213035005945, "res": {"No": 0.9790597007033821, "Yes": 0.020940213035005945}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 6.822450041457619e-07}, "ground_truth": 1}, {"key": "35633632", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00046069732150830716, "res": {"No": 0.9995391702146781, "Yes": 0.00046069732150830716}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9648305817591643, "res": {"Yes": 0.9648305817591643, "No": 0.03516929423297448}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.06855723055366222, "res": {"No": 0.9314412325319404, "Yes": 0.06855723055366222}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9979652968207078, "res": {"Yes": 0.9979652968207078, "No": 0.002034033726757251}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9720791157787235, "res": {"Yes": 0.9720791157787235, "No": 0.027920298775974607}, "ground_truth": 1}, {"key": "10741274", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999942038320978, "res": {"Yes": 0.9999942038320978, "No": 5.2065870168390985e-06}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994873712390449, "res": {"Yes": 0.9994873712390449, "No": 0.0005122880978821554}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.221331324205713e-06, "res": {"No": 0.9999928926002577, "Yes": 4.221331324205713e-06}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.22142233124399405, "res": {"No": 0.7785775328913408, "Yes": 0.22142233124399405}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.05708656950822265, "res": {"No": 0.9429130880241896, "Yes": 0.05708656950822265}, "ground_truth": 1}, {"key": "30605795", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.07904519511760523, "res": {"No": 0.9209545338636894, "Yes": 0.07904519511760523}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.553714094697726, "res": {"Yes": 0.553714094697726, "No": 0.44628505247924466}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0009998696874735518, "res": {"No": 0.9989908019831943, "Yes": 0.0009998696874735518}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8298163979089997, "res": {"Yes": 0.8298163979089997, "No": 0.17018339998542759}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6877568632135379, "res": {"Yes": 0.6877568632135379, "No": 0.31224295258967694}, "ground_truth": 1}, {"key": "30539722", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995629893169975, "res": {"Yes": 0.9995629893169975, "No": 0.00043674096327744953}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.01816187794658487, "res": {"No": 0.9818374567361554, "Yes": 0.01816187794658487}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 9.25947691095026e-06, "res": {"No": 0.9999886013079656, "Yes": 9.25947691095026e-06}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999819260003368, "res": {"Yes": 0.9999819260003368, "No": 1.753657251062125e-05}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9964968317621217, "res": {"Yes": 0.9964968317621217, "No": 0.003502154249401847}, "ground_truth": 1}, {"key": "18639299", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999960112362533, "res": {"Yes": 0.999960112362533, "No": 3.925746267348825e-05}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7887045418036971, "res": {"Yes": 0.7887045418036971, "No": 0.21129456001632285}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.05631175350468767, "res": {"No": 0.9436853982002591, "Yes": 0.05631175350468767}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9695391902113718, "res": {"Yes": 0.9695391902113718, "No": 0.030453763390502923}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9549575020144625, "res": {"Yes": 0.9549575020144625, "No": 0.0450383018056029}, "ground_truth": 1}, {"key": "39773552", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.023924261725202657, "res": {"No": 0.9760735663997969, "Yes": 0.023924261725202657}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9977000210142316, "res": {"Yes": 0.9977000210142316, "No": 0.002292111119150658}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 5.107947453191526e-07, "res": {"No": 0.9999987335551019, "Yes": 5.107947453191526e-07}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.769798459948927e-07}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 7.733702639350673e-08}, "ground_truth": 1}, {"key": "34086410", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, " Yes": 1.0556805720734008e-07}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 3.552372360858643e-07}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.024654831343267476, "res": {"No": 0.9753448443537063, "Yes": 0.024654831343267476}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.009646832074142587, "res": {"No": 0.9903528343648239, "Yes": 0.009646832074142587}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9715336583604963, "res": {"Yes": 0.9715336583604963, "No": 0.028464337245139484}, "ground_truth": 1}, {"key": "35454652", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0005762845550912951, "res": {"No": 0.999423065650661, "Yes": 0.0005762845550912951}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.024768098615841474, "res": {"No": 0.9752317967340219, "Yes": 0.024768098615841474}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.562907038826548e-07, "res": {"No": 0.9999981375378344, "Yes": 6.562907038826548e-07}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9939983943191065, "res": {"Yes": 0.9939983943191065, "No": 0.00600106695337904}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9968251944871863, "res": {"Yes": 0.9968251944871863, "No": 0.00317458837725872}, "ground_truth": 1}, {"key": "36158310", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988711395428842, "res": {"Yes": 0.9988711395428842, "No": 0.0011281174601374877}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9859279776767503, "res": {"Yes": 0.9859279776767503, "No": 0.0140711257555657}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00032547659619216427, "res": {"No": 0.9996741235592657, "Yes": 0.00032547659619216427}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7060378366050108, "res": {"Yes": 0.7060378366050108, "No": 0.293960169121547}, "ground_truth": 1}, {"key": "35688387", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.016934014288272608, "res": {"No": 0.9830640080006245, "Yes": 0.016934014288272608}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7358845749982506, "res": {"Yes": 0.7358845749982506, "No": 0.26411499065666566}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997728867541188, "res": {"Yes": 0.9997728867541188, "No": 0.0002265726304963484}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 2.0143137324605816e-06}, "ground_truth": 1}, {"key": "34209292", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9953725902045493, "res": {"Yes": 0.9953725902045493, "No": 0.004627283037884502}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 1.3669263114131403e-07}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.10244022717640115, "res": {"No": 0.8975585086932133, "Yes": 0.10244022717640115}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999964686909351, "res": {"Yes": 0.9999964686909351, "No": 3.16360929562317e-06}, "ground_truth": 1}, {"key": "25037859", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999950382530095, "res": {"Yes": 0.9999950382530095, "No": 4.694898801793159e-06}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999228038037797, "res": {"Yes": 0.9999228038037797, "No": 7.613655908348878e-05}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00010273979790292894, "res": {"No": 0.9998969389311568, "Yes": 0.00010273979790292894}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.20140672661004114, "res": {"No": 0.7985932473488677, "Yes": 0.20140672661004114}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998789411982082, "res": {"Yes": 0.9998789411982082, "No": 0.00012067512989677807}, "ground_truth": 1}, {"key": "36412121", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999539140419904, "res": {"Yes": 0.9999539140419904, "No": 4.566472225812382e-05}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9955174109274891, "res": {"Yes": 0.9955174109274891, "No": 0.004482138512090696}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.5735355825613036e-05, "res": {"No": 0.9999584435804919, "Yes": 3.5735355825613036e-05}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0470484903285533, "res": {"No": 0.9529509115938213, "Yes": 0.0470484903285533}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.001573937244276496, "res": {"No": 0.9984246018445321, "Yes": 0.001573937244276496}, "ground_truth": 1}, {"key": "34909172", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0005922523778443292, "res": {"No": 0.999406870770727, "Yes": 0.0005922523778443292}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00031447058990878904, "res": {"No": 0.9996847256294127, "Yes": 0.00031447058990878904}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0003947620814409334, "res": {"No": 0.9996049131873577, "Yes": 0.0003947620814409334}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0506827633277923, "res": {"No": 0.949316796203087, "Yes": 0.0506827633277923}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4962921319151016, "res": {"No": 0.5037077702522518, "Yes": 0.4962921319151016}, "ground_truth": 1}, {"key": "39011806", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.03409095769810613, "res": {"No": 0.96590766425072, "Yes": 0.03409095769810613}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.4787153294562477, "res": {"No": 0.521284490100303, "Yes": 0.4787153294562477}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.7431501916311788e-05, "res": {"No": 0.9999715555225518, "Yes": 2.7431501916311788e-05}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0021050585447537178, "res": {"No": 0.9978947864769563, "Yes": 0.0021050585447537178}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998907410091983, "res": {"Yes": 0.9998907410091983, "No": 0.00010893959539854406}, "ground_truth": 1}, {"key": "33096163", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9337338822462674, "res": {"Yes": 0.9337338822462674, "No": 0.06626518717566314}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.045103501360462914, "res": {"No": 0.9548962988395813, "Yes": 0.045103501360462914}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.021019666069123134, "res": {"No": 0.9789802874966043, "Yes": 0.021019666069123134}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.6067486435363062, "res": {"Yes": 0.6067486435363062, "No": 0.3932511038715039}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996364755210411, "res": {"Yes": 0.9996364755210411, "No": 0.00036312806128668845}, "ground_truth": 1}, {"key": "38762205", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9976322719006505, "res": {"Yes": 0.9976322719006505, "No": 0.002367657995422004}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999943230348141, "res": {"Yes": 0.9999943230348141, "No": 5.538460410884911e-06}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00011410368561460586, "res": {"No": 0.9998854966360107, "Yes": 0.00011410368561460586}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999148177982098, "res": {"Yes": 0.9999148177982098, "No": 8.49768237854898e-05}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999967070975216, "res": {"Yes": 0.9999967070975216, "No": 2.9379455893684233e-06}, "ground_truth": 1}, {"key": "35519177", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999193471666147, "res": {"Yes": 0.9999193471666147, "No": 8.039400091888319e-05}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999981375378344, "res": {"Yes": 0.9999981375378344, "No": 1.3489473640433615e-06}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.008783523869288865, "res": {"No": 0.9912163585699207, "Yes": 0.008783523869288865}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9947569092342994, "res": {"Yes": 0.9947569092342994, "No": 0.005242596437661126}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994777243634263, "res": {"Yes": 0.9994777243634263, "No": 0.0005204475205835613}, "ground_truth": 1}, {"key": "36192531", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999995276659155, "res": {"Yes": 0.999995276659155, "No": 4.069843546141945e-06}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994517628669264, "res": {"Yes": 0.9994517628669264, "No": 0.0005462222575161365}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.07701500546080392, "res": {"No": 0.9229808659277103, "Yes": 0.07701500546080392}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9145097825971105, "res": {"Yes": 0.9145097825971105, "No": 0.08548586827786818}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8433453221850703, "res": {"Yes": 0.8433453221850703, "No": 0.1566457331602349}, "ground_truth": 1}, {"key": "33160852", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.997688744773008, "res": {"Yes": 0.997688744773008, "No": 0.002303849176222933}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00024943479989241975, "res": {"No": 0.9997491818801253, "Yes": 0.00024943479989241975}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00022136801835463457, "res": {"No": 0.9997784880673918, "Yes": 0.00022136801835463457}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0005657139478534442, "res": {"No": 0.9994341415583088, "Yes": 0.0005657139478534442}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.052117473634163795, "res": {"No": 0.9478823801465491, "Yes": 0.052117473634163795}, "ground_truth": 1}, {"key": "36312304", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.1663995258596883, "res": {"No": 0.8336003901107489, "Yes": 0.1663995258596883}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.2896227977663696, "res": {"No": 0.7103772230260347, "Yes": 0.2896227977663696}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.09291836193518566, "res": {"No": 0.9070814149461714, "Yes": 0.09291836193518566}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993963944131913, "res": {"Yes": 0.9993963944131913, "No": 0.0006034850439023322}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999978707566687, "res": {"Yes": 0.999978707566687, "No": 2.0945159257280174e-05}, "ground_truth": 1}, {"key": "33773343", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9500159500520684, "res": {"Yes": 0.9500159500520684, "No": 0.04998349140363713}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.999974535534225, "res": {"Yes": 0.999974535534225, "No": 2.5308531642632223e-05}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 5.771000515012135e-05, "res": {"No": 0.9999256644730222, "Yes": 5.771000515012135e-05}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.12499546779214513, "res": {"No": 0.8750027935509167, "Yes": 0.12499546779214513}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5202979607848591, "res": {"Yes": 0.5202979607848591, "No": 0.47969958288861614}, "ground_truth": 1}, {"key": "34913320", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.11243620329630365, "res": {"No": 0.8875629327550825, "Yes": 0.11243620329630365}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.27943451701723854, "res": {"No": 0.7205635246326518, "Yes": 0.27943451701723854}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.2221980006037577, "res": {"No": 0.7778019112595574, "Yes": 0.2221980006037577}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9972733874786923, "res": {"Yes": 0.9972733874786923, "No": 0.0027264845778639936}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.11033511989527217, "res": {"No": 0.8896646135369802, "Yes": 0.11033511989527217}, "ground_truth": 1}, {"key": "33784155", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9839010922382458, "res": {"Yes": 0.9839010922382458, "No": 0.01609829360300136}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7830596535544787, "res": {"Yes": 0.7830596535544787, "No": 0.2169399265376345}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.000723041671888268, "res": {"No": 0.9992738923438429, "Yes": 0.000723041671888268}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.5253173094571534, "res": {"Yes": 0.5253173094571534, "No": 0.4746760536147949}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7614719062298698, "res": {"Yes": 0.7614719062298698, "No": 0.23852527486306518}, "ground_truth": 1}, {"key": "24085062", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.1934736019209621, "res": {"No": 0.8065244787891895, "Yes": 0.1934736019209621}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.29068766627266424, "res": {"No": 0.7093105053598624, "Yes": 0.29068766627266424}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.21601986671393167, "res": {"No": 0.7839798503862131, "Yes": 0.21601986671393167}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9958114405869227, "res": {"Yes": 0.9958114405869227, "No": 0.004188297299810403}, "ground_truth": 1}, {"key": "33893487", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999056399421903, "res": {"Yes": 0.9999056399421903, "No": 9.410155373302074e-05}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.014866968591279355, "res": {"No": 0.9851323316312692, "Yes": 0.014866968591279355}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.2679011761721465e-06, "res": {"No": 0.9999932502087799, "Yes": 6.2679011761721465e-06}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.033155853558655135, "res": {"No": 0.9668440321228091, "Yes": 0.033155853558655135}, "ground_truth": 1}, {"key": "40913011", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.2793152239493547, "res": {"No": 0.7206846183013362, "Yes": 0.2793152239493547}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.007878194702712482, "res": {"No": 0.9921216402449138, "Yes": 0.007878194702712482}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9601741113264705, "res": {"Yes": 0.9601741113264705, "No": 0.039825104468520466}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8388650346467614, "res": {"Yes": 0.8388650346467614, "No": 0.16113444505740498}, "ground_truth": 1}, {"key": "29642545", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9975857617721196, "res": {"Yes": 0.9975857617721196, "No": 0.0024124655612079208}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999431862619615, "res": {"Yes": 0.9999431862619615, "No": 5.6361007214828586e-05}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0053941809947398, "res": {"No": 0.9946057057396769, "Yes": 0.0053941809947398}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0005264916952599616, "res": {"No": 0.999473438981938, "Yes": 0.0005264916952599616}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7565261191835837, "res": {"Yes": 0.7565261191835837, "No": 0.2434737366443412}, "ground_truth": 1}, {"key": "35969159", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.20857848118626404, "res": {"No": 0.7914213601986404, "Yes": 0.20857848118626404}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.04204974318306596, "res": {"No": 0.9579500138329281, "Yes": 0.04204974318306596}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 5.1669292573265034e-06, "res": {"No": 0.9999930118027176, "Yes": 5.1669292573265034e-06}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8083931718399765, "res": {"Yes": 0.8083931718399765, "No": 0.191606306319915}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980987545612131, "res": {"Yes": 0.9980987545612131, "No": 0.001900888253904084}, "ground_truth": 1}, {"key": "37081669", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996587550872944, "res": {"Yes": 0.9996587550872944, "No": 0.00034101001895931946}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9978858795074221, "res": {"Yes": 0.9978858795074221, "No": 0.002113891959463986}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0018403393408321983, "res": {"No": 0.998159443804812, "Yes": 0.0018403393408321983}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999727475263555, "res": {"Yes": 0.9999727475263555, "No": 2.7097041656614578e-05}, "ground_truth": 1}, {"key": "40048022", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9920460732175832, "res": {"Yes": 0.9920460732175832, "No": 0.007953720280210652}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8696852016467692, "res": {"Yes": 0.8696852016467692, "No": 0.13031433311739937}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0021476314398396297, "res": {"No": 0.997851929612407, "Yes": 0.0021476314398396297}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9959963594250022, "res": {"Yes": 0.9959963594250022, "No": 0.004003605295242575}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995922900163132, "res": {"Yes": 0.9995922900163132, "No": 0.000407392974110081}, "ground_truth": 1}, {"key": "32884004", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9975693881323513, "res": {"Yes": 0.9975693881323513, "No": 0.0024302989609490773}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999874092852638, "res": {"Yes": 0.9999874092852638, "No": 1.217385425243626e-05}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.000904770714959241, "res": {"No": 0.9990950218799214, "Yes": 0.000904770714959241}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.19677579397960104, "res": {"No": 0.8032223373384806, "Yes": 0.19677579397960104}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00018271024876727064, "res": {"No": 0.9998169757209873, "Yes": 0.00018271024876727064}, "ground_truth": 1}, {"key": "39022490", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.021269958518648158, "res": {"No": 0.9787285476765857, "Yes": 0.021269958518648158}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0008650144032629357, "res": {"No": 0.9991347677594673, "Yes": 0.0008650144032629357}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.6009488183781142e-05, "res": {"No": 0.999983475621529, "Yes": 1.6009488183781142e-05}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1688810091356721, "res": {"No": 0.8311188283043567, "Yes": 0.1688810091356721}, "ground_truth": 1}, {"key": "35159385", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0008035219943351407, "res": {"No": 0.9991964123896011, "Yes": 0.0008035219943351407}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 2.5012898978781853e-06, "res": {"No": 0.9999971839107652, "Yes": 2.5012898978781853e-06}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8065878983022622, "res": {"Yes": 0.8065878983022622, "No": 0.19341131345012555}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1206231326577892, "res": {"No": 0.8793763464239504, "Yes": 0.1206231326577892}, "ground_truth": 1}, {"key": "34363669", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9533290918067545, "res": {"Yes": 0.9533290918067545, "No": 0.04666917950289525}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.08987929279683322, "res": {"No": 0.910120259414463, "Yes": 0.08987929279683322}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0026185996207498154, "res": {"No": 0.9973792701242795, "Yes": 0.0026185996207498154}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0700119316020584, "res": {"No": 0.9299879313147058, "Yes": 0.0700119316020584}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987232006028353, "res": {"Yes": 0.9987232006028353, "No": 0.001276722157496917}, "ground_truth": 1}, {"key": "36119687", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9979472514759722, "res": {"Yes": 0.9979472514759722, "No": 0.002052532258652359}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9961605227140718, "res": {"Yes": 0.9961605227140718, "No": 0.0038391895090941126}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998984884226488, "res": {"Yes": 0.9998984884226488, "No": 0.0001011663870558245}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999173208681078, "res": {"Yes": 0.9999173208681078, "No": 8.237323432246317e-05}, "ground_truth": 1}, {"key": "35217446", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995955072092758, "res": {"Yes": 0.9995955072092758, "No": 0.00040431349629194575}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9736045772050262, "res": {"Yes": 0.9736045772050262, "No": 0.026395115629002854}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.019254871217508095, "res": {"No": 0.9807385781465552, "Yes": 0.019254871217508095}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0003678365044144776, "res": {"No": 0.999621472439641, "Yes": 0.0003678365044144776}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5978639017384285, "res": {"Yes": 0.5978639017384285, "No": 0.40213320078882325}, "ground_truth": 1}, {"key": "39049331", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.11617890401158383, "res": {"No": 0.8838194184354459, "Yes": 0.11617890401158383}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.7117760632203736e-05, "res": {"No": 0.9999689331225854, "Yes": 1.7117760632203736e-05}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.001312842690571828, "res": {"No": 0.99868705356934, "Yes": 0.001312842690571828}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0002098927231319416, "res": {"No": 0.999789806303791, "Yes": 0.0002098927231319416}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 6.044806447660196e-05, "res": {"No": 0.9999393719679535, "Yes": 6.044806447660196e-05}, "ground_truth": 1}, {"key": "36472242", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.002281688591101273, "res": {"No": 0.9977182962524317, "Yes": 0.002281688591101273}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0031512912169246307, "res": {"No": 0.9968482891011355, "Yes": 0.0031512912169246307}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.4302088248447327e-05, "res": {"No": 0.9999855020530962, "Yes": 1.4302088248447327e-05}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993934161464159, "res": {"Yes": 0.9993934161464159, "No": 0.0006064880700077067}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998978924633294, "res": {"Yes": 0.9998978924633294, "No": 0.00010201150060566425}, "ground_truth": 1}, {"key": "31854721", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999958726752174, "res": {"Yes": 0.9999958726752174, "No": 4.069916803985097e-06}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9563611110780837, "res": {"Yes": 0.9563611110780837, "No": 0.04363863923948925}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999804955832136, "res": {"Yes": 0.9999804955832136, "No": 1.9210011164544198e-05}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999881244990143, "res": {"Yes": 0.9999881244990143, "No": 1.07164672951054e-05}, "ground_truth": 1}, {"key": "18725849", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999981375378344, "res": {"Yes": 0.9999981375378344, "No": 1.5742430569077826e-06}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998930056303059, "res": {"Yes": 0.9998930056303059, "No": 0.00010648195753326099}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.1068133768260296e-06, "res": {"No": 0.9999975415208221, "Yes": 2.1068133768260296e-06}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0018924469589884812, "res": {"No": 0.9981074289753733, "Yes": 0.0018924469589884812}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5350677738585172, "res": {"Yes": 0.5350677738585172, "No": 0.4649316841474041}, "ground_truth": 1}, {"key": "36883179", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.02753261436818242, "res": {"No": 0.9724666501329188, "Yes": 0.02753261436818242}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7332780628390906, "res": {"Yes": 0.7332780628390906, "No": 0.26672094951946324}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00015434780932848215, "res": {"No": 0.9998437919917416, "Yes": 0.00015434780932848215}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.014969222786018917, "res": {"No": 0.9850304190525927, "Yes": 0.014969222786018917}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9889305463133188, "res": {"Yes": 0.9889305463133188, "No": 0.011069149106839357}, "ground_truth": 1}, {"key": "34266359", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9734988280720862, "res": {"Yes": 0.9734988280720862, "No": 0.026499693820502757}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.001030018413207394, "res": {"No": 0.9989697464759552, "Yes": 0.001030018413207394}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.136573989308176e-05, "res": {"No": 0.9999886013079656, "Yes": 1.136573989308176e-05}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.04049534701452837, "res": {"No": 0.9595042760542681, "Yes": 0.04049534701452837}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.910059633772693, "res": {"Yes": 0.910059633772693, "No": 0.089939145361764}, "ground_truth": 1}, {"key": "31920289", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.03933701680439018, "res": {"No": 0.9606628798133391, "Yes": 0.03933701680439018}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9523956612273274, "res": {"Yes": 0.9523956612273274, "No": 0.0476036614254632}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0006149909535135565, "res": {"No": 0.9993849688092665, "Yes": 0.0006149909535135565}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0012442840185407514, "res": {"No": 0.9987556619314493, "Yes": 0.0012442840185407514}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8828126458470609, "res": {"Yes": 0.8828126458470609, "No": 0.11718715579942039}, "ground_truth": 1}, {"key": "36292997", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9982286933186519, "res": {"Yes": 0.9982286933186519, "No": 0.0017707696436240138}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.36503921237703557, "res": {"No": 0.6349606820740916, "Yes": 0.36503921237703557}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.04992467048012435, "res": {"No": 0.9500752319468819, "Yes": 0.04992467048012435}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9968325400194262, "res": {"Yes": 0.9968325400194262, "No": 0.0031665931028263612}, "ground_truth": 1}, {"key": "30412533", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4773548234256288, "res": {"No": 0.5226442796288426, "Yes": 0.4773548234256288}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.03280980090982348, "res": {"No": 0.9671893798943053, "Yes": 0.03280980090982348}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 7.192497472028463e-05, "res": {"No": 0.999923042191404, "Yes": 7.192497472028463e-05}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.002105442752996071, "res": {"No": 0.9978941917318408, "Yes": 0.002105442752996071}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 2.9977453765522245e-05, "res": {"No": 0.9999663107274963, "Yes": 2.9977453765522245e-05}, "ground_truth": 1}, {"key": "40433191", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.07332343556318738, "res": {"No": 0.9266762956781166, "Yes": 0.07332343556318738}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9133788534192046, "res": {"Yes": 0.9133788534192046, "No": 0.0866208786080637}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00015443164294771507, "res": {"No": 0.9998453414008744, "Yes": 0.00015443164294771507}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.006260238472169149, "res": {"No": 0.9937395651964208, "Yes": 0.006260238472169149}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999928926002577, "res": {"Yes": 0.9999928926002577, "No": 6.8498897548646234e-06}, "ground_truth": 1}, {"key": "34565591", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997002136449121, "res": {"Yes": 0.9997002136449121, "No": 0.00029958181672564495}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9253424349785551, "res": {"Yes": 0.9253424349785551, "No": 0.07465742468472629}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 9.279523058863262e-07, "res": {"No": 0.9999982567412194, "Yes": 9.279523058863262e-07}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.3539853326141878, "res": {"No": 0.6460143576384498, "Yes": 0.3539853326141878}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999716747231683, "res": {"Yes": 0.9999716747231683, "No": 2.8155326578994354e-05}, "ground_truth": 1}, {"key": "36062480", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999975415208221, "res": {"Yes": 0.9999975415208221, "No": 2.354051904215267e-06}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.008620574924094206, "res": {"No": 0.991379308107398, "Yes": 0.008620574924094206}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.119700876622815e-06, "res": {"No": 0.9999950382530095, "Yes": 4.119700876622815e-06}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.05070496724043176, "res": {"No": 0.9492944523966088, "Yes": 0.05070496724043176}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3210312206467016, "res": {"No": 0.6789674708557352, "Yes": 0.3210312206467016}, "ground_truth": 1}, {"key": "37276883", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7505015519670243, "res": {"Yes": 0.7505015519670243, "No": 0.24949684728566485}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9835329922113597, "res": {"Yes": 0.9835329922113597, "No": 0.016466537296089764}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.2225151810566e-05, "res": {"No": 0.9999576091905158, "Yes": 4.2225151810566e-05}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.989891097925134, "res": {"Yes": 0.989891097925134, "No": 0.010107798746226705}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999593971683173, "res": {"Yes": 0.9999593971683173, "No": 4.0362153767111685e-05}, "ground_truth": 1}, {"key": "38509260", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8324254588960376, "res": {"Yes": 0.8324254588960376, "No": 0.1675743241275027}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00236190684740778, "res": {"No": 0.9976380882135137, "Yes": 0.00236190684740778}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.46569638105647665, "res": {"No": 0.5343025112257386, "Yes": 0.46569638105647665}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.2844788127697461, "res": {"No": 0.7155207641010047, "Yes": 0.2844788127697461}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993128224147374, "res": {"Yes": 0.9993128224147374, "No": 0.0006860472877732951}, "ground_truth": 1}, {"key": "37139607", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9934791188267699, "res": {"Yes": 0.9934791188267699, "No": 0.006518732655032104}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.0614187588808342e-05, "res": {"No": 0.9999877668918251, "Yes": 1.0614187588808342e-05}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 2.679985966059989e-06, "res": {"No": 0.9999959918780326, "Yes": 2.679985966059989e-06}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9957692392910595, "res": {"Yes": 0.9957692392910595, "No": 0.004230348083779312}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9741449101674551, "res": {"Yes": 0.9741449101674551, "No": 0.025854531334126074}, "ground_truth": 1}, {"key": "37092824", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6454886190932368, "res": {"Yes": 0.6454886190932368, "No": 0.3545090515675854}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.009780989736545637, "res": {"No": 0.9902185120163183, "Yes": 0.009780989736545637}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 8.849593784981174e-06, "res": {"No": 0.9999903893441826, "Yes": 8.849593784981174e-06}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 2.038445602715468e-06, "res": {"No": 0.9999965878943212, "Yes": 2.038445602715468e-06}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 9.277540366653713e-05, "res": {"No": 0.9999071894471658, "Yes": 9.277540366653713e-05}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.43979050080146487, "res": {"No": 0.560209325254278, "Yes": 0.43979050080146487}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.17269877276871584, "res": {"No": 0.8273011605256717, "Yes": 0.17269877276871584}, "ground_truth": 1}, {"key": "39396038", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998728699017159, "res": {"Yes": 0.9998728699017159, "No": 0.00012695079341631406}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9785773771110912, "res": {"Yes": 0.9785773771110912, "No": 0.021421990309539826}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 9.730979488284372e-06, "res": {"No": 0.9999894357248024, "Yes": 9.730979488284372e-06}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9932056357785479, "res": {"Yes": 0.9932056357785479, "No": 0.006794002780402571}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3118032497083029, "res": {"No": 0.6881966523409707, "Yes": 0.3118032497083029}, "ground_truth": 1}, {"key": "39076884", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7579439353450254, "res": {"Yes": 0.7579439353450254, "No": 0.24205575180480543}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.07271505732507198, "res": {"No": 0.9272841351231798, "Yes": 0.07271505732507198}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.009239578603965059, "res": {"No": 0.9907603651931302, "Yes": 0.009239578603965059}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.7617269658786205, "res": {"Yes": 0.7617269658786205, "No": 0.23827135684085582}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9912910842316732, "res": {"Yes": 0.9912910842316732, "No": 0.008707818314785832}, "ground_truth": 1}, {"key": "27763432", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.986514996412938, "res": {"Yes": 0.986514996412938, "No": 0.013483786706520576}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9813840870482762, "res": {"Yes": 0.9813840870482762, "No": 0.018615066486522294}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0005940298424789834, "res": {"No": 0.9994052065597914, "Yes": 0.0005940298424789834}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0007585969115252949, "res": {"No": 0.9992410459514289, "Yes": 0.0007585969115252949}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.03989663876952941, "res": {"No": 0.9601025685383803, "Yes": 0.03989663876952941}, "ground_truth": 1}, {"key": "37806929", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.06539197725406477, "res": {"No": 0.9346057652995794, "Yes": 0.06539197725406477}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.039088225322125844, "res": {"No": 0.9609111375671333, "Yes": 0.039088225322125844}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00032918060712315073, "res": {"No": 0.9996704294603056, "Yes": 0.00032918060712315073}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999825220097418, "res": {"Yes": 0.9999825220097418, "No": 1.7169637425880712e-05}, "ground_truth": 1}, {"key": "32334186", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.977080202231482, "res": {"Yes": 0.977080202231482, "No": 0.022919545893646504}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.008321722619225584, "res": {"No": 0.9916776986929594, "Yes": 0.008321722619225584}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00023076538798020253, "res": {"No": 0.9997690731077205, "Yes": 0.00023076538798020253}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0008181867063781109, "res": {"No": 0.9991817732801942, "Yes": 0.0008181867063781109}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0759408523688974, "res": {"No": 0.9240591077130399, "Yes": 0.0759408523688974}, "ground_truth": 1}, {"key": "36187324", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8703297379512159, "res": {"Yes": 0.8703297379512159, "No": 0.12967027456631636}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0005643352884691295, "res": {"No": 0.9994355711499273, "Yes": 0.0005643352884691295}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0007239976582826626, "res": {"No": 0.9992754409197937, "Yes": 0.0007239976582826626}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.06407987672442647, "res": {"No": 0.9359189014577977, "Yes": 0.06407987672442647}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.21388777872212647, "res": {"No": 0.7861115307427726, "Yes": 0.21388777872212647}, "ground_truth": 1}, {"key": "35306009", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0022266523717389885, "res": {"No": 0.9977727701652948, "Yes": 0.0022266523717389885}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00011140425895588994, "res": {"No": 0.9998849006744357, "Yes": 0.00011140425895588994}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9981584919604203, "res": {"Yes": 0.9981584919604203, "No": 0.0018407374492854973}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9844394855338648, "res": {"Yes": 0.9844394855338648, "No": 0.015556939030325338}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9756847254074978, "res": {"Yes": 0.9756847254074978, "No": 0.024313585762228}, "ground_truth": 1}, {"key": "39490050", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9985309729781011, "res": {"Yes": 0.9985309729781011, "No": 0.001467207272139177}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997350039676527, "res": {"Yes": 0.9997350039676527, "No": 0.0002641966092462111}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.10517994854815893, "res": {"No": 0.8948194615444796, "Yes": 0.10517994854815893}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.6117273063355823e-05, "res": {"No": 0.9999835948245663, "Yes": 1.6117273063355823e-05}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0010671599623983251, "res": {"No": 0.9989325114716829, "Yes": 0.0010671599623983251}, "ground_truth": 1}, {"key": "38072149", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 4.40971236938598e-05, "res": {"No": 0.9999557020111849, "Yes": 4.40971236938598e-05}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9882747290967738, "res": {"Yes": 0.9882747290967738, "No": 0.011724225761082684}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.02198472027232034, "res": {"No": 0.9780150172537729, "Yes": 0.02198472027232034}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999988527586581, "res": {"Yes": 0.9999988527586581, "No": 7.930789988767533e-07}, "ground_truth": 1}, {"key": "35899689", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9880172518500768, "res": {"Yes": 0.9880172518500768, "No": 0.011981889230761093}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9987875253420897, "res": {"Yes": 0.9987875253420897, "No": 0.0012123684935046156}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.6695202954307989, "res": {"Yes": 0.6695202954307989, "No": 0.3304795822383902}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999807339855921, "res": {"Yes": 0.9999807339855921, "No": 1.9136692356756383e-05}, "ground_truth": 1}, {"key": "27994518", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996438634816706, "res": {"Yes": 0.9996438634816706, "No": 0.0003559388541037128}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9903833575095382, "res": {"Yes": 0.9903833575095382, "No": 0.009616561602235127}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00016479339832480204, "res": {"No": 0.9998327078448934, "Yes": 0.00016479339832480204}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.035002538204276304, "res": {"No": 0.9649962959927495, "Yes": 0.035002538204276304}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0028293867129974494, "res": {"No": 0.9971690685650125, "Yes": 0.0028293867129974494}, "ground_truth": 1}, {"key": "10615479", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9977760931532619, "res": {"Yes": 0.9977760931532619, "No": 0.0022223026298199312}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.10700905734698671, "res": {"No": 0.8929833975926703, "Yes": 0.10700905734698671}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.08778045599388586, "res": {"No": 0.9122192519146309, "Yes": 0.08778045599388586}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.7696208638545452, "res": {"Yes": 0.7696208638545452, "No": 0.2303779633308751}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9922653860658291, "res": {"Yes": 0.9922653860658291, "No": 0.007734043200674898}, "ground_truth": 1}, {"key": "40186667", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.06425371730456908, "res": {"No": 0.9357428810259829, "Yes": 0.06425371730456908}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.009224465787005956, "res": {"No": 0.9907751117801495, "Yes": 0.009224465787005956}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.04158322243150545, "res": {"No": 0.9584154855890253, "Yes": 0.04158322243150545}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999932502087799, "res": {"Yes": 0.9999932502087799, "No": 6.652006629609969e-06}, "ground_truth": 1}, {"key": "38622886", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999737011318213, "res": {"Yes": 0.9999737011318213, "No": 2.6113973598196013e-05}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9976199334605379, "res": {"Yes": 0.9976199334605379, "No": 0.0023795532952175327}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.1713646831699337e-05, "res": {"No": 0.9999835948245663, "Yes": 1.1713646831699337e-05}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 4.908005060718017e-06, "res": {"No": 0.9999914621674475, "Yes": 4.908005060718017e-06}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9599074494409848, "res": {"Yes": 0.9599074494409848, "No": 0.04009050723502719}, "ground_truth": 1}, {"key": "40686943", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9960945272733102, "res": {"Yes": 0.9960945272733102, "No": 0.003905285058575251}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9991527337329321, "res": {"Yes": 0.9991527337329321, "No": 0.0008467885841151289}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0002408185048737197, "res": {"No": 0.9997581089603562, "Yes": 0.0002408185048737197}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0008331948746505013, "res": {"No": 0.9991664196812675, "Yes": 0.0008331948746505013}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.11940597946574072, "res": {"No": 0.8805926520052789, "Yes": 0.11940597946574072}, "ground_truth": 1}, {"key": "30604567", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.012287846432623577, "res": {"No": 0.9877114026356875, "Yes": 0.012287846432623577}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.015490660268403261, "res": {"No": 0.9845081102488666, "Yes": 0.015490660268403261}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9760349536932745, "res": {"Yes": 0.9760349536932745, "No": 0.023964780634274045}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9692576769082444, "res": {"Yes": 0.9692576769082444, "No": 0.03074152292411885}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999798995780161, "res": {"Yes": 0.9999798995780161, "No": 1.994428344101682e-05}, "ground_truth": 1}, {"key": "35440903", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998176908203386, "res": {"Yes": 0.9998176908203386, "No": 0.00018214818479498683}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9944356781067087, "res": {"Yes": 0.9944356781067087, "No": 0.005564011155391294}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.7512682053615413, "res": {"Yes": 0.7512682053615413, "No": 0.24873054924268534}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.002531398404220945, "res": {"No": 0.9974680933961255, "Yes": 0.002531398404220945}, "ground_truth": 1}, {"key": "37219533", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.1738808299071461, "res": {"No": 0.8261158673968243, "Yes": 0.1738808299071461}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.12490180629820175, "res": {"No": 0.8750979902829594, "Yes": 0.12490180629820175}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.02724472648737597, "res": {"No": 0.9727543259431419, "Yes": 0.02724472648737597}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.14254392231408983, "res": {"No": 0.8574555483025003, "Yes": 0.14254392231408983}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999714363229496, "res": {"Yes": 0.9999714363229496, "No": 2.8463542502965878e-05}, "ground_truth": 1}, {"key": "40178965", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.31946453911809675, "res": {"No": 0.6805352214755336, "Yes": 0.31946453911809675}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7183424311633521, "res": {"Yes": 0.7183424311633521, "No": 0.2816569888488133}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.026835860702239738, "res": {"No": 0.9731631748795536, "Yes": 0.026835860702239738}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 8.203045313083854e-05, "res": {"No": 0.9999174400582596, "Yes": 8.203045313083854e-05}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9892966489032492, "res": {"Yes": 0.9892966489032492, "No": 0.010702017541587923}, "ground_truth": 1}, {"key": "13750468", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9288534805418979, "res": {"Yes": 0.9288534805418979, "No": 0.07114539350297922}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.016790198255688706, "res": {"No": 0.9832090619310033, "Yes": 0.016790198255688706}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.3795364789995834e-06, "res": {"No": 0.9999981375378344, "Yes": 1.3795364789995834e-06}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9897044636357385, "res": {"Yes": 0.9897044636357385, "No": 0.010294724494068538}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5836295322690289, "res": {"Yes": 0.5836295322690289, "No": 0.4163699545933046}, "ground_truth": 1}, {"key": "17754949", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.27540445950226583, "res": {"No": 0.7245955078715571, "Yes": 0.27540445950226583}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.08633093381375755, "res": {"No": 0.9136683490460125, "Yes": 0.08633093381375755}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.008400153495718517, "res": {"No": 0.9915990439206652, "Yes": 0.008400153495718517}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 7.915773900340995e-05, "res": {"No": 0.999920539107184, "Yes": 7.915773900340995e-05}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00253641274832947, "res": {"No": 0.9974631139480854, "Yes": 0.00253641274832947}, "ground_truth": 1}, {"key": "36675623", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00014888624499641002, "res": {"No": 0.9998508202684029, "Yes": 0.00014888624499641002}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.000276135188157801, "res": {"No": 0.9997235671645989, "Yes": 0.000276135188157801}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0007861208690030687, "res": {"No": 0.9992137913241281, "Yes": 0.0007861208690030687}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 7.974847011454522e-05, "res": {"No": 0.9999152945777069, "Yes": 7.974847011454522e-05}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9935088876823824, "res": {"Yes": 0.9935088876823824, "No": 0.0064910498311491335}, "ground_truth": 1}, {"key": "40035440", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0016980302095446116, "res": {"No": 0.9983018599741527, "Yes": 0.0016980302095446116}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998883571925221, "res": {"Yes": 0.9998883571925221, "No": 0.00011129079583529187}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.004594331582607564, "res": {"No": 0.9954049516870341, "Yes": 0.004594331582607564}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0008564280058073365, "res": {"No": 0.9991422674030854, "Yes": 0.0008564280058073365}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999193471666147, "res": {"Yes": 0.9999193471666147, "No": 8.045649133197866e-05}, "ground_truth": 1}, {"key": "37685909", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.98952806057902, "res": {"Yes": 0.98952806057902, "No": 0.010471682183544996}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9943048397631601, "res": {"Yes": 0.9943048397631601, "No": 0.005694969714543164}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9981890128197926, "res": {"Yes": 0.9981890128197926, "No": 0.0018103483385199294}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 4.3401467068312096e-07}, "ground_truth": 1}, {"key": "36938787", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999135066767632, "res": {"Yes": 0.9999135066767632, "No": 8.580081952007052e-05}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990819360787868, "res": {"Yes": 0.9990819360787868, "No": 0.0009173953908116016}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9926961134743978, "res": {"Yes": 0.9926961134743978, "No": 0.007303412312320143}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.005103633714067754, "res": {"No": 0.9948963680115798, "Yes": 0.005103633714067754}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9824589846631778, "res": {"Yes": 0.9824589846631778, "No": 0.017540413809229553}, "ground_truth": 1}, {"key": "39398068", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.10663642795165652, "res": {"No": 0.8933634250099777, "Yes": 0.10663642795165652}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998986076205548, "res": {"Yes": 0.9998986076205548, "No": 0.00010127803514334788}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991419100699088, "res": {"Yes": 0.9991419100699088, "No": 0.0008579157987045645}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999976607241361, "res": {"Yes": 0.9999976607241361, "No": 2.1213667152300353e-06}, "ground_truth": 1}, {"key": "39926408", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, " Yes": 1.1062342179278421e-07}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 8.803027099897201e-07}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00022093986445780256, "res": {"No": 0.999777296302151, "Yes": 0.00022093986445780256}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.02699332407586954, "res": {"No": 0.9730060518804572, "Yes": 0.02699332407586954}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.010296196744934621, "res": {"No": 0.9897028306247208, "Yes": 0.010296196744934621}, "ground_truth": 1}, {"key": "40465336", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00015114559203734633, "res": {"No": 0.9998485557488386, "Yes": 0.00015114559203734633}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 8.327110064653079e-05, "res": {"No": 0.9999166057074973, "Yes": 8.327110064653079e-05}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.5836977566187747e-05, "res": {"No": 0.9999837140256179, "Yes": 1.5836977566187747e-05}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.43798964957159064, "res": {"No": 0.5620102448410834, "Yes": 0.43798964957159064}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6343916568457169, "res": {"Yes": 0.6343916568457169, "No": 0.36560564468899837}, "ground_truth": 1}, {"key": "34173549", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6997927284499541, "res": {"Yes": 0.6997927284499541, "No": 0.3002042808173109}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9280386345540248, "res": {"Yes": 0.9280386345540248, "No": 0.0719609549083257}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.7293004441379641, "res": {"Yes": 0.7293004441379641, "No": 0.2706992101965135}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0029203406749613286, "res": {"No": 0.9970795664869067, "Yes": 0.0029203406749613286}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.12977708903987817, "res": {"No": 0.8702228332124295, "Yes": 0.12977708903987817}, "ground_truth": 1}, {"key": "33541535", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9883713742429504, "res": {"Yes": 0.9883713742429504, "No": 0.011628313917045163}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.3344033432715325, "res": {"No": 0.6655963188928312, "Yes": 0.3344033432715325}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.04103817286270342, "res": {"No": 0.9589614337261461, "Yes": 0.04103817286270342}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.015288132578786065, "res": {"No": 0.9847115321141139, "Yes": 0.015288132578786065}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7142252572881161, "res": {"Yes": 0.7142252572881161, "No": 0.28577414012440716}, "ground_truth": 1}, {"key": "35685195", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9901450009227517, "res": {"Yes": 0.9901450009227517, "No": 0.00985459928785666}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8783949564409629, "res": {"Yes": 0.8783949564409629, "No": 0.12160412345904029}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 8.614841442300872e-05, "res": {"No": 0.99991362587046, "Yes": 8.614841442300872e-05}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9831043252653767, "res": {"Yes": 0.9831043252653767, "No": 0.016893252451580146}, "ground_truth": 1}, {"key": "28440730", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.06659332045060407, "res": {"No": 0.9334059788815069, "Yes": 0.06659332045060407}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7844875005112781, "res": {"Yes": 0.7844875005112781, "No": 0.21551096264279046}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.04382190817533052, "res": {"No": 0.9561773247413902, "Yes": 0.04382190817533052}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.17689187655224534, "res": {"No": 0.8231074564995869, "Yes": 0.17689187655224534}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5290909149400218, "res": {"Yes": 0.5290909149400218, "No": 0.47090822751076883}, "ground_truth": 1}, {"key": "38338714", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9949369576266671, "res": {"Yes": 0.9949369576266671, "No": 0.005061998060541668}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.07360797523106505, "res": {"No": 0.9263911873500963, "Yes": 0.07360797523106505}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.002159388066435449, "res": {"No": 0.9978387518672682, "Yes": 0.002159388066435449}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999056399421903, "res": {"Yes": 0.9999056399421903, "No": 9.302721250794172e-05}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999770387506135, "res": {"Yes": 0.9999770387506135, "No": 2.1228689772581162e-05}, "ground_truth": 1}, {"key": "32191881", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7864605080610352, "res": {"Yes": 0.7864605080610352, "No": 0.21353831522558342}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999697675220106, "res": {"Yes": 0.9999697675220106, "No": 2.9573348226180062e-05}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0990843471670496, "res": {"No": 0.9009150949985212, "Yes": 0.0990843471670496}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997724100525223, "res": {"Yes": 0.9997724100525223, "No": 0.00022739976728983733}, "ground_truth": 1}, {"key": "37707251", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0695921016584601, "res": {"No": 0.9304077351709099, "Yes": 0.0695921016584601}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.12206048236569121, "res": {"No": 0.8779392579759161, "Yes": 0.12206048236569121}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.079235848202198e-05, "res": {"No": 0.9999683371212795, "Yes": 3.079235848202198e-05}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0008565202480707187, "res": {"No": 0.9991429819898906, "Yes": 0.0008565202480707187}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5145277959485962, "res": {"Yes": 0.5145277959485962, "No": 0.4854699442326098}, "ground_truth": 1}, {"key": "40172567", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9819754931481754, "res": {"Yes": 0.9819754931481754, "No": 0.01802362286710554}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7863870088966212, "res": {"Yes": 0.7863870088966212, "No": 0.2136120413764008}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.001742117415718178, "res": {"No": 0.9982577956030773, "Yes": 0.001742117415718178}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9650005130357772, "res": {"Yes": 0.9650005130357772, "No": 0.03499841514812862}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999254260847726, "res": {"Yes": 0.9999254260847726, "No": 7.432159518136892e-05}, "ground_truth": 1}, {"key": "33113255", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9977188873009254, "res": {"Yes": 0.9977188873009254, "No": 0.002280855470564874}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9864089813430954, "res": {"Yes": 0.9864089813430954, "No": 0.013590625845041589}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.2879147852460814e-05, "res": {"No": 0.9999865748701179, "Yes": 1.2879147852460814e-05}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.030431728931793453, "res": {"No": 0.9695642928755107, "Yes": 0.030431728931793453}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998584218565489, "res": {"Yes": 0.998584218565489, "No": 0.0014155091348346137}, "ground_truth": 1}, {"key": "33022143", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992051036975867, "res": {"Yes": 0.9992051036975867, "No": 0.0007940130985014485}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996985453065997, "res": {"Yes": 0.9996985453065997, "No": 0.00030076118904331006}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.005362001282420953, "res": {"No": 0.994638020009377, "Yes": 0.005362001282420953}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.988978003756583, "res": {"Yes": 0.988978003756583, "No": 0.011021603253950265}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980240744162966, "res": {"Yes": 0.9980240744162966, "No": 0.0019752197914714173}, "ground_truth": 1}, {"key": "32084473", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998074449011132, "res": {"Yes": 0.9998074449011132, "No": 0.00019210201479181915}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999967070975216, "res": {"Yes": 0.9999967070975216, "No": 2.6751476041958026e-06}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00020611835815855526, "res": {"No": 0.9997895679539296, "Yes": 0.00020611835815855526}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.003743394720385279, "res": {"No": 0.996255759813821, "Yes": 0.003743394720385279}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5040262343417821, "res": {"Yes": 0.5040262343417821, "No": 0.49597170512666294}, "ground_truth": 1}, {"key": "40564245", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3517870000617563, "res": {"No": 0.6482112971060984, "Yes": 0.3517870000617563}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990289808744778, "res": {"Yes": 0.9990289808744778, "No": 0.0009692553128743397}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0002263045272502825, "res": {"No": 0.9997733634559426, "Yes": 0.0002263045272502825}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.01862399455123503, "res": {"No": 0.9813753625825227, "Yes": 0.01862399455123503}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993534181242099, "res": {"Yes": 0.9993534181242099, "No": 0.0006458656809673849}, "ground_truth": 1}, {"key": "31717213", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9874348214303796, "res": {"Yes": 0.9874348214303796, "No": 0.012564360558122782}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8732047365171494, "res": {"Yes": 0.8732047365171494, "No": 0.12679483135428418}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.07405220215151372, "res": {"No": 0.92594719574071, "Yes": 0.07405220215151372}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.6590343179756136, "res": {"Yes": 0.6590343179756136, "No": 0.3409647089055452}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9332016226821042, "res": {"Yes": 0.9332016226821042, "No": 0.06679752166173647}, "ground_truth": 1}, {"key": "34861894", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5328824623787385, "res": {"Yes": 0.5328824623787385, "No": 0.4671168212624177}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.028919371913340815, "res": {"No": 0.971079742464987, "Yes": 0.028919371913340815}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.8791595892856126, "res": {"Yes": 0.8791595892856126, "No": 0.12084023231073268}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.20245610122716245, "res": {"No": 0.7975437315716867, "Yes": 0.20245610122716245}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.758052374560888, "res": {"Yes": 0.758052374560888, "No": 0.24194728672568644}, "ground_truth": 1}, {"key": "40838760", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8965151383702876, "res": {"Yes": 0.8965151383702876, "No": 0.10348464859823327}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.993434882173459, "res": {"Yes": 0.993434882173459, "No": 0.006565021475642858}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 7.128063872795947e-07, "res": {"No": 0.9999988527586581, "Yes": 7.128063872795947e-07}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9031520866433952, "res": {"Yes": 0.9031520866433952, "No": 0.09684708380606125}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.011639058788997, "res": {"No": 0.9883605476822142, "Yes": 0.011639058788997}, "ground_truth": 1}, {"key": "40044849", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9935818429236876, "res": {"Yes": 0.9935818429236876, "No": 0.0064167174029144914}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.006397018221970882, "res": {"No": 0.9936029127455734, "Yes": 0.006397018221970882}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.446937059545041e-06, "res": {"No": 0.9999951574563252, "Yes": 4.446937059545041e-06}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.2705105715347301, "res": {"No": 0.7294875118104698, "Yes": 0.2705105715347301}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991861764741429, "res": {"Yes": 0.9991861764741429, "No": 0.0008133919998364443}, "ground_truth": 1}, {"key": "30296116", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.843951205032505, "res": {"Yes": 0.843951205032505, "No": 0.15604741119338153}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.11732418075777705, "res": {"No": 0.8826755380349762, "Yes": 0.11732418075777705}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.7930949177465135, "res": {"Yes": 0.7930949177465135, "No": 0.20690459203727754}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9614297534083116, "res": {"Yes": 0.9614297534083116, "No": 0.03856957599314098}, "ground_truth": 1}, {"key": "34931360", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5444007339632021, "res": {"Yes": 0.5444007339632021, "No": 0.45559840877836927}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.09751719086072597, "res": {"No": 0.9024824490501879, "Yes": 0.09751719086072597}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.6053736897146354e-06, "res": {"No": 0.9999982567412194, "Yes": 1.6053736897146354e-06}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9623356169408324, "res": {"Yes": 0.9623356169408324, "No": 0.03766345191385437}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9978668879240878, "res": {"Yes": 0.9978668879240878, "No": 0.0021329597709177773}, "ground_truth": 1}, {"key": "18862422", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999297171049584, "res": {"Yes": 0.9999297171049584, "No": 7.020865246784626e-05}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994367589298377, "res": {"Yes": 0.9994367589298377, "No": 0.000563015443203042}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 9.30208490125181e-06, "res": {"No": 0.9999906277489198, "Yes": 9.30208490125181e-06}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.0300234386610931e-06, "res": {"No": 0.9999981375378344, "Yes": 1.0300234386610931e-06}, "ground_truth": 1}, {"key": "36361140", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9940760183863, "res": {"Yes": 0.9940760183863, "No": 0.005922583637728884}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 1.64533590010354e-06, "res": {"No": 0.9999964686909351, "Yes": 1.64533590010354e-06}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.2201680832604233e-06, "res": {"No": 0.9999947998470209, "Yes": 3.2201680832604233e-06}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0007473912860490932, "res": {"No": 0.9992523580236433, "Yes": 0.0007473912860490932}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990411169224735, "res": {"Yes": 0.9990411169224735, "No": 0.0009587022605034894}, "ground_truth": 1}, {"key": "39703329", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.2764354884693771, "res": {"No": 0.7235640563963258, "Yes": 0.2764354884693771}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.00328191232685437, "res": {"No": 0.9967181221728459, "Yes": 0.00328191232685437}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.074496906372656e-06, "res": {"No": 0.9999982567412194, "Yes": 1.074496906372656e-06}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.012390494164450459, "res": {"No": 0.9876086114267185, "Yes": 0.012390494164450459}, "ground_truth": 1}, {"key": "34033324", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 2.0080790286737813e-06, "res": {"No": 0.9999977799274644, "Yes": 2.0080790286737813e-06}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0001299025505190135, "res": {"No": 0.9998690558739306, "Yes": 0.0001299025505190135}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.282741720913756e-05, "res": {"No": 0.9999353192918872, "Yes": 6.282741720913756e-05}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0061113761623837045, "res": {"No": 0.9938882849778699, "Yes": 0.0061113761623837045}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.03266957376935084, "res": {"No": 0.9673303541506348, "Yes": 0.03266957376935084}, "ground_truth": 1}, {"key": "35658862", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.11670029638215583, "res": {"No": 0.8832996548338543, "Yes": 0.11670029638215583}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7757925476825841, "res": {"Yes": 0.7757925476825841, "No": 0.22420732436237895}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.208634316289876e-06, "res": {"No": 0.99999861435166, "Yes": 1.208634316289876e-06}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8964160699564724, "res": {"Yes": 0.8964160699564724, "No": 0.10358378260209655}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.02106272265011684, "res": {"No": 0.9789371105231914, "Yes": 0.02106272265011684}, "ground_truth": 1}, {"key": "36092657", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9436792435041625, "res": {"Yes": 0.9436792435041625, "No": 0.056320628936405666}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.07017896898105708, "res": {"No": 0.9298201208346157, "Yes": 0.07017896898105708}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 4.824347367256777e-05, "res": {"No": 0.9999514108804896, "Yes": 4.824347367256777e-05}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0007352323398969014, "res": {"No": 0.9992646159774662, "Yes": 0.0007352323398969014}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.990946103603934, "res": {"Yes": 0.990946103603934, "No": 0.009053583796900131}, "ground_truth": 1}, {"key": "26333438", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0007125382236730573, "res": {"No": 0.9992872261840283, "Yes": 0.0007125382236730573}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.010831962768445927, "res": {"No": 0.989167504655809, "Yes": 0.010831962768445927}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.016852487617405706, "res": {"No": 0.9831347439668948, "Yes": 0.016852487617405706}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9966301369767532, "res": {"Yes": 0.9966301369767532, "No": 0.003368627121381461}, "ground_truth": 1}, {"key": "34184963", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9980399833462462, "res": {"Yes": 0.9980399833462462, "No": 0.0019591066509016693}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.6601663237684489, "res": {"Yes": 0.6601663237684489, "No": 0.3398323062347634}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.5207685644648786, "res": {"Yes": 0.5207685644648786, "No": 0.47923135612692475}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0006325756751585416, "res": {"No": 0.9993673450405961, "Yes": 0.0006325756751585416}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8384323338677178, "res": {"Yes": 0.8384323338677178, "No": 0.16156760776275245}, "ground_truth": 1}, {"key": "35069975", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.49949927117684934, "res": {"No": 0.5005006407539544, "Yes": 0.49949927117684934}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9982226319926057, "res": {"Yes": 0.9982226319926057, "No": 0.0017773096333445952}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 2.5306608267316572e-05, "res": {"No": 0.9999740587314805, "Yes": 2.5306608267316572e-05}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999719131244437, "res": {"Yes": 0.9999719131244437, "No": 2.793358024118998e-05}, "ground_truth": 1}, {"key": "36443950", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999958726752174, "res": {"Yes": 0.9999958726752174, "No": 3.6796129056434393e-06}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00010114473976533728, "res": {"No": 0.9998982500468776, "Yes": 0.00010114473976533728}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.5976204054980978, "res": {"Yes": 0.5976204054980978, "No": 0.4023775306904616}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999907469518097, "res": {"Yes": 0.9999907469518097, "No": 8.988675955743872e-06}, "ground_truth": 1}, {"key": "29460858", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.004108291624600851, "res": {"No": 0.9958913596534422, "Yes": 0.004108291624600851}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0012901041853920195, "res": {"No": 0.9987096435267642, "Yes": 0.0012901041853920195}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00011834328051496789, "res": {"No": 0.9998807290433461, "Yes": 0.00011834328051496789}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0002201496534318896, "res": {"No": 0.9997797990277938, "Yes": 0.0002201496534318896}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.99965303526619, "res": {"Yes": 0.99965303526619, "No": 0.0003467840520951757}, "ground_truth": 1}, {"key": "36155704", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8156523715872455, "res": {"Yes": 0.8156523715872455, "No": 0.1843471894769949}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.4917941718111165, "res": {"No": 0.5082054418835605, "Yes": 0.4917941718111165}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.42958740679888313, "res": {"No": 0.5704105809508592, "Yes": 0.42958740679888313}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.999581450616242, "res": {"Yes": 0.999581450616242, "No": 0.000418139855024946}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9962084332103458, "res": {"Yes": 0.9962084332103458, "No": 0.003790852693882134}, "ground_truth": 1}, {"key": "37185211", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992130766866801, "res": {"Yes": 0.9992130766866801, "No": 0.0007863782084748003}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998992035803005, "res": {"Yes": 0.9998992035803005, "No": 0.00010022950014696968}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0001015483010764033, "res": {"No": 0.9998977732755078, "Yes": 0.0001015483010764033}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9950050494622391, "res": {"Yes": 0.9950050494622391, "No": 0.004994310072725692}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999920581810364, "res": {"Yes": 0.9999920581810364, "No": 7.682235288210778e-06}, "ground_truth": 1}, {"key": "36454885", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999995276659155, "res": {"Yes": 0.999995276659155, "No": 4.081867310936403e-06}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.4629056818508746e-07}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00016565123065459417, "res": {"No": 0.9998336613158132, "Yes": 0.00016565123065459417}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9256721469474735, "res": {"Yes": 0.9256721469474735, "No": 0.07432591495366361}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.029609882651912885, "res": {"No": 0.9703899072639542, "Yes": 0.029609882651912885}, "ground_truth": 1}, {"key": "33148906", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9344926007391459, "res": {"Yes": 0.9344926007391459, "No": 0.06550614001809789}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9391790747709889, "res": {"Yes": 0.9391790747709889, "No": 0.060818850314162544}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0001474014118347737, "res": {"No": 0.9998492708507798, "Yes": 0.0001474014118347737}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.14794260270504253, "res": {"No": 0.8520559800731893, "Yes": 0.14794260270504253}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.82993895424398, "res": {"Yes": 0.82993895424398, "No": 0.1700570006823944}, "ground_truth": 1}, {"key": "18086604", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.043110327215759386, "res": {"No": 0.9568883442605209, "Yes": 0.043110327215759386}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.007683124335737544, "res": {"No": 0.9923160960918501, "Yes": 0.007683124335737544}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.7344918089169133e-05, "res": {"No": 0.9999822836059372, "Yes": 1.7344918089169133e-05}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0014616227322961132, "res": {"No": 0.9985379738031475, "Yes": 0.0014616227322961132}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00021460273139632565, "res": {"No": 0.9997844469448988, "Yes": 0.00021460273139632565}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.005107271348842526, "res": {"No": 0.9948917609556354, "Yes": 0.005107271348842526}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998193593674841, "res": {"Yes": 0.9998193593674841, "No": 0.00017912798636392403}, "ground_truth": 1}, {"key": "39501530", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9644033008335356, "res": {"Yes": 0.9644033008335356, "No": 0.03559578667336704}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998101860569464, "res": {"Yes": 0.9998101860569464, "No": 0.00018896854222723265}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00014949628723356635, "res": {"No": 0.9998491516787523, "Yes": 0.00014949628723356635}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8444787296219739, "res": {"Yes": 0.8444787296219739, "No": 0.15552076800164796}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9958112033846658, "res": {"Yes": 0.9958112033846658, "No": 0.004188406196955855}, "ground_truth": 1}, {"key": "30948874", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9924432560508011, "res": {"Yes": 0.9924432560508011, "No": 0.007555806035004372}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9708079005284515, "res": {"Yes": 0.9708079005284515, "No": 0.029191322165192286}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.003090423940223078, "res": {"No": 0.9969094233947909, "Yes": 0.003090423940223078}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.601711430456554, "res": {"Yes": 0.601711430456554, "No": 0.3982884450044777}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999676219241812, "res": {"Yes": 0.9999676219241812, "No": 3.211285951841413e-05}, "ground_truth": 1}, {"key": "39410675", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.032817436638877824, "res": {"No": 0.9671820138080381, "Yes": 0.032817436638877824}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9904030059198696, "res": {"Yes": 0.9904030059198696, "No": 0.00959472702155134}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.8191688011138086, "res": {"Yes": 0.8191688011138086, "No": 0.18083105163533847}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7724240439718391, "res": {"Yes": 0.7724240439718391, "No": 0.22757593865568357}, "ground_truth": 1}, {"key": "32903337", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5923595562116568, "res": {"Yes": 0.5923595562116568, "No": 0.40763985611192843}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.2649194927754763, "res": {"No": 0.7350801265476447, "Yes": 0.2649194927754763}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.3342404282198324, "res": {"No": 0.6657594765447453, "Yes": 0.3342404282198324}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 5.504668029859564e-05, "res": {"No": 0.9999447358231209, "Yes": 5.504668029859564e-05}, "ground_truth": 1}, {"key": "27685132", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990451659843832, "res": {"Yes": 0.9990451659843832, "No": 0.0009547099317578454}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8871646608183117, "res": {"Yes": 0.8871646608183117, "No": 0.11283507947629266}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.1256478008087796e-06, "res": {"No": 0.9999942038320978, "Yes": 3.1256478008087796e-06}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00015955067094745607, "res": {"No": 0.9998402164567504, "Yes": 0.00015955067094745607}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8185072127937006, "res": {"Yes": 0.8185072127937006, "No": 0.18149256324017815}, "ground_truth": 1}, {"key": "22791471", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9172565416180289, "res": {"Yes": 0.9172565416180289, "No": 0.08274336079734354}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 8.256101955831688e-06, "res": {"No": 0.9999893165220688, "Yes": 8.256101955831688e-06}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0024638502754271477, "res": {"No": 0.9975340513590105, "Yes": 0.0024638502754271477}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1296477139013766, "res": {"No": 0.8703508698137932, "Yes": 0.1296477139013766}, "ground_truth": 1}, {"key": "32292348", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995433331340693, "res": {"Yes": 0.9995433331340693, "No": 0.00045493786899349444}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.697369506670754, "res": {"Yes": 0.697369506670754, "No": 0.3026288323837157}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 5.0778678807291234e-05, "res": {"No": 0.9999475965531086, "Yes": 5.0778678807291234e-05}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997427465353486, "res": {"Yes": 0.9997427465353486, "No": 0.0002569250884986375}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9986725483444392, "res": {"Yes": 0.9986725483444392, "No": 0.0013269409811722337}, "ground_truth": 1}, {"key": "20482930", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993144864718347, "res": {"Yes": 0.9993144864718347, "No": 0.0006851109924871457}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998156683911591, "res": {"Yes": 0.9998156683911591, "No": 0.0001839009979092079}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 3.381851920660056e-05, "res": {"No": 0.9999658339276736, "Yes": 3.381851920660056e-05}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999857404566682, "res": {"Yes": 0.9999857404566682, "No": 1.4175208492401031e-05}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999908661547138, "res": {"Yes": 0.9999908661547138, "No": 9.104333946127678e-06}, "ground_truth": 1}, {"key": "11635754", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.628143894498183e-07}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998528464381476, "res": {"Yes": 0.9998528464381476, "No": 0.00014711146400218846}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.017933595170564448, "res": {"No": 0.9820664292711394, "Yes": 0.017933595170564448}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995676361961799, "res": {"Yes": 0.9995676361961799, "No": 0.00043224975508759716}, "ground_truth": 1}, {"key": "40029096", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9838803193537751, "res": {"Yes": 0.9838803193537751, "No": 0.016119707294144414}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993271097922245, "res": {"Yes": 0.9993271097922245, "No": 0.0006727888647849126}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.00113239377716942, "res": {"No": 0.9988666185624507, "Yes": 0.00113239377716942}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0005740936624249123, "res": {"No": 0.9994253291465832, "Yes": 0.0005740936624249123}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.44998636350461696, "res": {"No": 0.5500134755806716, "Yes": 0.44998636350461696}, "ground_truth": 1}, {"key": "40414719", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9944220011302204, "res": {"Yes": 0.9944220011302204, "No": 0.005577492368075412}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7384251767631249, "res": {"Yes": 0.7384251767631249, "No": 0.26157469388288707}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.4782405425496208e-06, "res": {"No": 0.9999964686909351, "Yes": 1.4782405425496208e-06}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.018000633990712354, "res": {"No": 0.9819992916126286, "Yes": 0.018000633990712354}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1756654227945312, "res": {"No": 0.8243333499261994, "Yes": 0.1756654227945312}, "ground_truth": 1}, {"key": "39537616", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.004114819951509575, "res": {"No": 0.9958849710308616, "Yes": 0.004114819951509575}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.06026137064615953, "res": {"No": 0.9397382687396678, "Yes": 0.06026137064615953}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9819437699603212, "res": {"Yes": 0.9819437699603212, "No": 0.01805517737775408}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6968348084290638, "res": {"Yes": 0.6968348084290638, "No": 0.30316141274050534}, "ground_truth": 1}, {"key": "33245830", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9972601096697487, "res": {"Yes": 0.9972601096697487, "No": 0.0027384768700160346}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 6.31433571059341e-06, "res": {"No": 0.9999877668918251, "Yes": 6.31433571059341e-06}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.002587102643274532, "res": {"No": 0.9974109342271066, "Yes": 0.002587102643274532}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998834704001013, "res": {"Yes": 0.9998834704001013, "No": 0.00011576202299788399}, "ground_truth": 1}, {"key": "39243601", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6479551746146198, "res": {"Yes": 0.6479551746146198, "No": 0.35204129321305155}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.4023112645683219, "res": {"No": 0.5976884185701139, "Yes": 0.4023112645683219}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9936063254793587, "res": {"Yes": 0.9936063254793587, "No": 0.006389759808201674}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999015874128364, "res": {"Yes": 0.9999015874128364, "No": 9.75034301064812e-05}, "ground_truth": 1}, {"key": "35815905", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999982567412194, "res": {"Yes": 0.9999982567412194, "No": 1.5979691758683565e-06}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999614235510903, "res": {"Yes": 0.9999614235510903, "No": 3.826851739253479e-05}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.1421261371317681e-06, "res": {"No": 0.9999982567412194, "Yes": 1.1421261371317681e-06}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.15988290107114567, "res": {"No": 0.8401170933620784, "Yes": 0.15988290107114567}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3495153494362916, "res": {"No": 0.6504845840024123, "Yes": 0.3495153494362916}, "ground_truth": 1}, {"key": "35260212", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.46378193727147166, "res": {"No": 0.5362179915170997, "Yes": 0.46378193727147166}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.6603536065063044, "res": {"Yes": 0.6603536065063044, "No": 0.33964612914812764}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.00792871340903137, "res": {"No": 0.9920707109877498, "Yes": 0.00792871340903137}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999982567412194, "res": {"Yes": 0.9999982567412194, "No": 1.316345791602542e-06}, "ground_truth": 1}, {"key": "39193924", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999956342685299, "res": {"Yes": 0.9999956342685299, "No": 4.079651458644905e-06}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998536807357079, "res": {"Yes": 0.9998536807357079, "No": 0.00014546035248460908}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 1.0197591428693394e-05, "res": {"No": 0.9999869324773808, "Yes": 1.0197591428693394e-05}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.019682251271962097, "res": {"No": 0.9803158875709241, "Yes": 0.019682251271962097}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9001359243551383, "res": {"Yes": 0.9001359243551383, "No": 0.09986002735262378}, "ground_truth": 1}, {"key": "40658569", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5417774883153039, "res": {"Yes": 0.5417774883153039, "No": 0.4582176909682411}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9163954990233764, "res": {"Yes": 0.9163954990233764, "No": 0.08360089108807682}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0066866886331814574, "res": {"No": 0.9933127736825623, "Yes": 0.0066866886331814574}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8088780054653408, "res": {"Yes": 0.8088780054653408, "No": 0.1911209892329112}, "ground_truth": 1}, {"key": "33497596", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5346778836759798, "res": {"Yes": 0.5346778836759798, "No": 0.4653218789815751}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.8840184637213515, "res": {"Yes": 0.8840184637213515, "No": 0.11598009470163372}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0033753913696596763, "res": {"No": 0.9966240929316146, "Yes": 0.0033753913696596763}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9173884562624393, "res": {"Yes": 0.9173884562624393, "No": 0.08261016855825398}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9984543122077647, "res": {"Yes": 0.9984543122077647, "No": 0.0015451484331668727}, "ground_truth": 1}, {"key": "40339241", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.27721985146471273, "res": {"No": 0.722779877718966, "Yes": 0.27721985146471273}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.1143356566656446, "res": {"No": 0.885664046771502, "Yes": 0.1143356566656446}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.1216579816882399, "res": {"No": 0.8783415253008872, "Yes": 0.1216579816882399}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999874092852638, "res": {"Yes": 0.9999874092852638, "No": 1.2146366334822457e-05}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998354490699897, "res": {"Yes": 0.9998354490699897, "No": 0.00016253673828390517}, "ground_truth": 1}, {"key": "31792608", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999988527586581, "res": {"Yes": 0.9999988527586581, " Yes": 5.941696216585883e-07}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.7760395605563268, "res": {"Yes": 0.7760395605563268, "No": 0.22395984647579614}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.4849306150652946, "res": {"No": 0.5150690292098076, "Yes": 0.4849306150652946}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.03291663914403326, "res": {"No": 0.9670831206345957, "Yes": 0.03291663914403326}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999947998470209, "res": {"Yes": 0.9999947998470209, "No": 4.9476789022107765e-06}, "ground_truth": 1}, {"key": "33132662", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998442687373722, "res": {"Yes": 0.9998442687373722, "No": 0.00015541493777067284}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.009838946860673724, "res": {"No": 0.9901610077362193, "Yes": 0.009838946860673724}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 6.4939732725928346e-06, "res": {"No": 0.9999897933310884, "Yes": 6.4939732725928346e-06}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999924157887603, "res": {"Yes": 0.9999924157887603, "No": 7.183391016325141e-06}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999987335551019, "res": {"Yes": 0.9999987335551019, "No": 9.73089281477812e-07}, "ground_truth": 1}, {"key": "37577457", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998795371462323, "res": {"Yes": 0.9998795371462323, "No": 0.00012002145974047396}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.999996945503965, "res": {"Yes": 0.999996945503965, "No": 2.8406603932165427e-06}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.4281870697655599, "res": {"No": 0.5718116300121783, "Yes": 0.4281870697655599}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.0024929525697318998, "res": {"No": 0.9975061700734058, "Yes": 0.0024929525697318998}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.2710177126245856, "res": {"No": 0.728981270024282, "Yes": 0.2710177126245856}, "ground_truth": 1}, {"key": "38701278", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.40041694990780036, "res": {"No": 0.5995810006281357, "Yes": 0.40041694990780036}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 9.24152083803153e-05, "res": {"No": 0.9999068318704197, "Yes": 9.24152083803153e-05}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0004883874071237705, "res": {"No": 0.9995114272905351, "Yes": 0.0004883874071237705}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9896478373354517, "res": {"Yes": 0.9896478373354517, "No": 0.010351686765885692}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999707211216348, "res": {"Yes": 0.9999707211216348, "No": 2.9078310655165097e-05}, "ground_truth": 1}, {"key": "34570783", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996151606896513, "res": {"Yes": 0.9996151606896513, "No": 0.0003843988010075816}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9986085918072474, "res": {"Yes": 0.9986085918072474, "No": 0.0013912230870501117}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0009339982438345444, "res": {"No": 0.9990659886004412, "Yes": 0.0009339982438345444}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.11313446635238383, "res": {"No": 0.8868654617708233, "Yes": 0.11313446635238383}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.36138908618259175, "res": {"No": 0.6386106191770408, "Yes": 0.36138908618259175}, "ground_truth": 1}, {"key": "39064526", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9467171826163613, "res": {"Yes": 0.9467171826163613, "No": 0.05328232586928511}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.020294016298630285, "res": {"No": 0.9797058690392998, "Yes": 0.020294016298630285}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0015296189911223467, "res": {"No": 0.9984697629085646, "Yes": 0.0015296189911223467}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.013393670960264057, "res": {"No": 0.9866055004903868, "Yes": 0.013393670960264057}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7972307012761553, "res": {"Yes": 0.7972307012761553, "No": 0.20276842797119563}, "ground_truth": 1}, {"key": "40741545", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.23532576281872022, "res": {"No": 0.7646735257275544, "Yes": 0.23532576281872022}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.0008593110452082174, "res": {"No": 0.9991400045082751, "Yes": 0.0008593110452082174}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.0009513933154548242, "res": {"No": 0.99904813953685, "Yes": 0.0009513933154548242}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.20823354846986328, "res": {"No": 0.7917660280035438, "Yes": 0.20823354846986328}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1508849429243987, "res": {"No": 0.8491144466906148, "Yes": 0.1508849429243987}, "ground_truth": 1}, {"key": "36929751", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9956401717657793, "res": {"Yes": 0.9956401717657793, "No": 0.004359060615480567}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.012441905850365004, "res": {"No": 0.987557917790174, "Yes": 0.012441905850365004}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.9965216968605853, "res": {"Yes": 0.9965216968605853, "No": 0.0034779195306189705}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 1.9311437905559218e-05, "res": {"No": 0.9999806147848957, "Yes": 1.9311437905559218e-05}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999180360292298, "res": {"Yes": 0.9999180360292298, "No": 8.16727621746283e-05}, "ground_truth": 1}, {"key": "23984730", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9887706244527463, "res": {"Yes": 0.9887706244527463, "No": 0.01122891647217846}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.23706979204394577, "res": {"No": 0.7629301335322953, "Yes": 0.23706979204394577}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 5.944993667552763e-05, "res": {"No": 0.9999402063417121, "Yes": 5.944993667552763e-05}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 2.5391451390950742e-05, "res": {"No": 0.9999723899261651, "Yes": 2.5391451390950742e-05}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.36353990795066005, "res": {"No": 0.636459622347519, "Yes": 0.36353990795066005}, "ground_truth": 1}, {"key": "36007415", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5246948098451553, "res": {"Yes": 0.5246948098451553, "No": 0.47530422798444566}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_500_ft_gpt35", "target_model": "human", "recognition_score": 0.001994592121338592, "res": {"No": 0.9980010388892725, "Yes": 0.001994592121338592}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_500_ft_gpt35", "target_model": "claude", "recognition_score": 0.9934855844099142, "res": {"Yes": 0.9934855844099142, "No": 0.006514238235198771}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_500_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994717709621076, "res": {"Yes": 0.9994717709621076, "No": 0.0005279832490739496}, "ground_truth": 1}, {"key": "38875041", "model": "cnn_500_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997230904865185, "res": {"Yes": 0.9997230904865185, "No": 0.0002768914516162741}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_500_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999253068846696, "res": {"Yes": 0.9999253068846696, "No": 7.455078402809811e-05}, "ground_truth": 0}]