[{"key": "33773576", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.26303267893963483, "res": {"No": 0.7369508340063228, "Yes": 0.26303267893963483}, "ground_truth": 0}, {"key": "33773576", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6753016898737398, "res": {"Yes": 0.6753016898737398, "No": 0.324680193862967}, "ground_truth": 0}, {"key": "33773576", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7829031042581017, "res": {"Yes": 0.7829031042581017, "No": 0.217082394359352}, "ground_truth": 1}, {"key": "33773576", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7552894090029191, "res": {"Yes": 0.7552894090029191, "No": 0.24469356656272281}, "ground_truth": 0}, {"key": "33773576", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7488856330356226, "res": {"Yes": 0.7488856330356226, "No": 0.25109513192593913}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4487063563293113, "res": {"No": 0.5512775368496288, "Yes": 0.4487063563293113}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7688536036241067, "res": {"Yes": 0.7688536036241067, "No": 0.23112707765548757}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7470285911125844, "res": {"Yes": 0.7470285911125844, "No": 0.25295317156875124}, "ground_truth": 1}, {"key": "37642631", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6782955442823537, "res": {"Yes": 0.6782955442823537, "No": 0.3216820962001682}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7148277459986051, "res": {"Yes": 0.7148277459986051, "No": 0.28514373286526157}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.32622416866030435, "res": {"No": 0.6737633381983553, "Yes": 0.32622416866030435}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7358292091257179, "res": {"Yes": 0.7358292091257179, "No": 0.26414700333346225}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7322168249016352, "res": {"Yes": 0.7322168249016352, "No": 0.26776469175299517}, "ground_truth": 1}, {"key": "36609836", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7291900582844991, "res": {"Yes": 0.7291900582844991, "No": 0.2707899096232351}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8233753557155983, "res": {"Yes": 0.8233753557155983, "No": 0.17660789257380963}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6221258347700119, "res": {"Yes": 0.6221258347700119, "No": 0.377856947786573}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5659256612231651, "res": {"Yes": 0.5659256612231651, "No": 0.4340575977403379}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4307171667184405, "res": {"No": 0.569263932016781, "Yes": 0.4307171667184405}, "ground_truth": 1}, {"key": "41035610", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4773178584994031, "res": {"No": 0.5226636178249434, "Yes": 0.4773178584994031}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.46450005607827266, "res": {"No": 0.5354751636009875, "Yes": 0.46450005607827266}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6104338470152406, "res": {"Yes": 0.6104338470152406, "No": 0.38955259137518206}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6931116372870322, "res": {"Yes": 0.6931116372870322, "No": 0.30686968510401086}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.760092927614152, "res": {"Yes": 0.760092927614152, "No": 0.23989067026326544}, "ground_truth": 1}, {"key": "37592684", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8667558977485038, "res": {"Yes": 0.8667558977485038, "No": 0.13323070892005057}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3999659741969382, "res": {"No": 0.6000170545019698, "Yes": 0.3999659741969382}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4557987976789239, "res": {"No": 0.5441822662438236, "Yes": 0.4557987976789239}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4835442732638186, "res": {"No": 0.5164255727661596, "Yes": 0.4835442732638186}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4836144406283884, "res": {"No": 0.516362572689365, "Yes": 0.4836144406283884}, "ground_truth": 1}, {"key": "38951040", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6273242668669377, "res": {"Yes": 0.6273242668669377, "No": 0.3726540945719197}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5064797329565992, "res": {"Yes": 0.5064797329565992, "No": 0.4934908457135002}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5473212415806975, "res": {"Yes": 0.5473212415806975, "No": 0.45265003578682167}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5135130839482309, "res": {"Yes": 0.5135130839482309, "No": 0.48645528168907576}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6106348898756094, "res": {"Yes": 0.6106348898756094, "No": 0.3893331792593981}, "ground_truth": 1}, {"key": "40774469", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5600235178354629, "res": {"Yes": 0.5600235178354629, "No": 0.4399550000120173}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5859173150254031, "res": {"Yes": 0.5859173150254031, "No": 0.4140512419458429}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.41132523556977096, "res": {"No": 0.5886536493222231, "Yes": 0.41132523556977096}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5009626157213974, "res": {"Yes": 0.5009626157213974, "No": 0.4990162093953439}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5884992657183007, "res": {"Yes": 0.5884992657183007, "No": 0.4114817540274792}, "ground_truth": 1}, {"key": "40876288", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6241487235428261, "res": {"Yes": 0.6241487235428261, "No": 0.3758206665628844}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6049893284696519, "res": {"Yes": 0.6049893284696519, "No": 0.39498576606846897}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5997986460533317, "res": {"Yes": 0.5997986460533317, "No": 0.4001873566140915}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.641334151947496, "res": {"Yes": 0.641334151947496, "No": 0.35863228184001056}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6155773075661773, "res": {"Yes": 0.6155773075661773, "No": 0.38440153832805635}, "ground_truth": 1}, {"key": "40340131", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6902739853423565, "res": {"Yes": 0.6902739853423565, "No": 0.3097098461398363}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6018863974715674, "res": {"Yes": 0.6018863974715674, "No": 0.39809207748112546}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6656143900782044, "res": {"Yes": 0.6656143900782044, "No": 0.33436779808540285}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5428787936927826, "res": {"Yes": 0.5428787936927826, "No": 0.4571000656598775}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7539952128497294, "res": {"Yes": 0.7539952128497294, "No": 0.2459906873665195}, "ground_truth": 1}, {"key": "30121591", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6409016281905447, "res": {"Yes": 0.6409016281905447, "No": 0.3590821810921717}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6335280134958305, "res": {"Yes": 0.6335280134958305, "No": 0.36645164632073446}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3495808897085194, "res": {"No": 0.6504018151053808, "Yes": 0.3495808897085194}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6111994750587753, "res": {"Yes": 0.6111994750587753, "No": 0.38877482461381496}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.44214305297626383, "res": {"No": 0.5578380453707683, "Yes": 0.44214305297626383}, "ground_truth": 1}, {"key": "35623366", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5208446803526082, "res": {"Yes": 0.5208446803526082, "No": 0.4791323092424615}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5151444150784589, "res": {"Yes": 0.5151444150784589, "No": 0.48483509799169594}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4994213953218469, "res": {"No": 0.5005505131223993, "Yes": 0.4994213953218469}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7019987047805357, "res": {"Yes": 0.7019987047805357, "No": 0.297975532962544}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7810784156666213, "res": {"Yes": 0.7810784156666213, "No": 0.21890294957770362}, "ground_truth": 1}, {"key": "41014093", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6736659796931604, "res": {"Yes": 0.6736659796931604, "No": 0.3263039728516134}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7732986369572162, "res": {"Yes": 0.7732986369572162, "No": 0.22667282516581597}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.28498726041808364, "res": {"No": 0.7149985744974335, "Yes": 0.28498726041808364}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6233101194619435, "res": {"Yes": 0.6233101194619435, "No": 0.37666469141069997}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.44761956168630324, "res": {"No": 0.5523653973375336, "Yes": 0.44761956168630324}, "ground_truth": 1}, {"key": "11387984", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5930285714190358, "res": {"Yes": 0.5930285714190358, "No": 0.4069498743375572}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4964892238311618, "res": {"No": 0.5034937147598723, "Yes": 0.4964892238311618}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.13051585047714861, "res": {"No": 0.8694666076570089, "Yes": 0.13051585047714861}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4740688569549329, "res": {"No": 0.5259036804645171, "Yes": 0.4740688569549329}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.31882956435342596, "res": {"No": 0.6811440077931887, "Yes": 0.31882956435342596}, "ground_truth": 1}, {"key": "39508312", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6200264565491188, "res": {"Yes": 0.6200264565491188, "No": 0.3799424823328901}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4501195116652303, "res": {"No": 0.5498531370270214, "Yes": 0.4501195116652303}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.15694987376425146, "res": {"No": 0.8430380041230026, "Yes": 0.15694987376425146}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6012745360473771, "res": {"Yes": 0.6012745360473771, "No": 0.39870435565974965}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4097532089115867, "res": {"No": 0.590225831537814, "Yes": 0.4097532089115867}, "ground_truth": 1}, {"key": "35815369", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6169338951238185, "res": {"Yes": 0.6169338951238185, "No": 0.3830352183931084}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4294010277862138, "res": {"No": 0.5705775987994182, "Yes": 0.4294010277862138}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6078839846158428, "res": {"Yes": 0.6078839846158428, "No": 0.39209404784321594}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3868013597602696, "res": {"No": 0.6131832058988615, "Yes": 0.3868013597602696}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5703900465395666, "res": {"Yes": 0.5703900465395666, "No": 0.4295981680982081}, "ground_truth": 1}, {"key": "35802823", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6298473062530926, "res": {"Yes": 0.6298473062530926, "No": 0.37012831358124376}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5506828419497358, "res": {"Yes": 0.5506828419497358, "No": 0.44930338454742375}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4757139931800413, "res": {"No": 0.5242624506660025, "Yes": 0.4757139931800413}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4236637715337812, "res": {"No": 0.5763096361274836, "Yes": 0.4236637715337812}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7835939137332847, "res": {"Yes": 0.7835939137332847, "No": 0.21638641743320267}, "ground_truth": 1}, {"key": "38499968", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5769314636682309, "res": {"Yes": 0.5769314636682309, "No": 0.4230334605962165}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5588270418800004, "res": {"Yes": 0.5588270418800004, "No": 0.4411420528928639}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7667411256774832, "res": {"Yes": 0.7667411256774832, "No": 0.23323302917356747}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7375899441757888, "res": {"Yes": 0.7375899441757888, "No": 0.2623890114198541}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6373323735348484, "res": {"Yes": 0.6373323735348484, "No": 0.36264891102632035}, "ground_truth": 1}, {"key": "36926726", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.73383922050143, "res": {"Yes": 0.73383922050143, "No": 0.26613456890091786}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.52591220017315, "res": {"Yes": 0.52591220017315, "No": 0.4740647989428856}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.459926695410988, "res": {"No": 0.5400625407101931, "Yes": 0.459926695410988}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.685924469560146, "res": {"Yes": 0.685924469560146, "No": 0.3140541046859969}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7987137721497952, "res": {"Yes": 0.7987137721497952, "No": 0.2012727551514022}, "ground_truth": 1}, {"key": "40903712", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7181588965722125, "res": {"Yes": 0.7181588965722125, "No": 0.28182465280633967}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.607631692185589, "res": {"Yes": 0.607631692185589, "No": 0.3923471870209197}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5804066734613749, "res": {"Yes": 0.5804066734613749, "No": 0.4195786019778418}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6279050802728476, "res": {"Yes": 0.6279050802728476, "No": 0.37206048642869544}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6325212892839215, "res": {"Yes": 0.6325212892839215, "No": 0.36745052325183913}, "ground_truth": 1}, {"key": "19614862", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5991670729347855, "res": {"Yes": 0.5991670729347855, "No": 0.400802777237584}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6695284167612383, "res": {"Yes": 0.6695284167612383, "No": 0.330443892370796}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.22057725117213817, "res": {"No": 0.7793935045678917, "Yes": 0.22057725117213817}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.41197496336938594, "res": {"No": 0.588002252681419, "Yes": 0.41197496336938594}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4888639739918614, "res": {"No": 0.5111138066370393, "Yes": 0.4888639739918614}, "ground_truth": 1}, {"key": "38861704", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3964150541808779, "res": {"No": 0.6035587103968681, "Yes": 0.3964150541808779}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4505551003905253, "res": {"No": 0.5494192542367209, "Yes": 0.4505551003905253}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2979245239177996, "res": {"No": 0.7020620560020192, "Yes": 0.2979245239177996}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7168164846695422, "res": {"Yes": 0.7168164846695422, "No": 0.28316256829440956}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6909558017467777, "res": {"Yes": 0.6909558017467777, "No": 0.30902515426786803}, "ground_truth": 1}, {"key": "34349607", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6904918701925514, "res": {"Yes": 0.6904918701925514, "No": 0.3094845832163744}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8350435832370048, "res": {"Yes": 0.8350435832370048, "No": 0.16493586130766358}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.601349369319792, "res": {"Yes": 0.601349369319792, "No": 0.39863686072594384}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6292720901880388, "res": {"Yes": 0.6292720901880388, "No": 0.3707055341569036}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.697933837077362, "res": {"Yes": 0.697933837077362, "No": 0.3020470436690984}, "ground_truth": 1}, {"key": "20773800", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6263189705703198, "res": {"Yes": 0.6263189705703198, "No": 0.3736577341141138}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6090762828019535, "res": {"Yes": 0.6090762828019535, "No": 0.39089656251213817}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.50276239310584, "res": {"Yes": 0.50276239310584, "No": 0.4972131358721427}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7042054028270524, "res": {"Yes": 0.7042054028270524, "No": 0.29576691032199554}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6806944581227266, "res": {"Yes": 0.6806944581227266, "No": 0.31928463541784574}, "ground_truth": 1}, {"key": "35545608", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7579022344169057, "res": {"Yes": 0.7579022344169057, "No": 0.24207981334237338}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7029919768273285, "res": {"Yes": 0.7029919768273285, "No": 0.29698952801791406}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.481115217566801, "res": {"No": 0.5188530015200531, "Yes": 0.481115217566801}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8167742402753628, "res": {"Yes": 0.8167742402753628, "No": 0.18320330252892086}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8831161869363165, "res": {"Yes": 0.8831161869363165, "No": 0.11686334713520803}, "ground_truth": 1}, {"key": "37258984", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8186750485326325, "res": {"Yes": 0.8186750485326325, "No": 0.18130312948643673}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6831211198960869, "res": {"Yes": 0.6831211198960869, "No": 0.31684816329323934}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5185377488546262, "res": {"Yes": 0.5185377488546262, "No": 0.481444172225456}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5111470812289275, "res": {"Yes": 0.5111470812289275, "No": 0.4888231066719134}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5937229633978426, "res": {"Yes": 0.5937229633978426, "No": 0.40625619346585023}, "ground_truth": 1}, {"key": "37274562", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6042320899320045, "res": {"Yes": 0.6042320899320045, "No": 0.3957401381203453}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5874829233644309, "res": {"Yes": 0.5874829233644309, "No": 0.41248662416492193}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6031994343726225, "res": {"Yes": 0.6031994343726225, "No": 0.39677800343485037}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6511971765942475, "res": {"Yes": 0.6511971765942475, "No": 0.34877355740958205}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.667819200509411, "res": {"Yes": 0.667819200509411, "No": 0.3321537217187157}, "ground_truth": 1}, {"key": "40828068", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6820343880835122, "res": {"Yes": 0.6820343880835122, "No": 0.31793983888375865}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6165252377934439, "res": {"Yes": 0.6165252377934439, "No": 0.3834471681445}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.9086969124978407, "res": {"Yes": 0.9086969124978407, "No": 0.09127298753991184}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5197434263703976, "res": {"Yes": 0.5197434263703976, "No": 0.4802048189248108}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.719294578015314, "res": {"Yes": 0.719294578015314, "No": 0.2806645766642713}, "ground_truth": 1}, {"key": "37807180", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5760931572652912, "res": {"Yes": 0.5760931572652912, "No": 0.4238699044327169}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4809514978650828, "res": {"No": 0.5189752940166916, "Yes": 0.4809514978650828}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.540020109663295, "res": {"Yes": 0.540020109663295, "No": 0.4599598665203969}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4622078487504063, "res": {"No": 0.5377661547012926, "Yes": 0.4622078487504063}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5779957287748225, "res": {"Yes": 0.5779957287748225, "No": 0.42196913813582065}, "ground_truth": 1}, {"key": "40748607", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6367432919521312, "res": {"Yes": 0.6367432919521312, "No": 0.3632374595666272}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6675479540598697, "res": {"Yes": 0.6675479540598697, "No": 0.3324294240209097}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.41458232970186354, "res": {"No": 0.5853923926150655, "Yes": 0.41458232970186354}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7530370418712886, "res": {"Yes": 0.7530370418712886, "No": 0.24694466396094034}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5314045943216841, "res": {"Yes": 0.5314045943216841, "No": 0.4685704102071603}, "ground_truth": 1}, {"key": "40123819", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5178048733829148, "res": {"Yes": 0.5178048733829148, "No": 0.48217334145888807}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5757146156543501, "res": {"Yes": 0.5757146156543501, "No": 0.4242576428765072}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.43530284270279923, "res": {"No": 0.5646716314852899, "Yes": 0.43530284270279923}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7152338405764291, "res": {"Yes": 0.7152338405764291, "No": 0.2847419350416811}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7046774067282505, "res": {"Yes": 0.7046774067282505, "No": 0.2952935891751754}, "ground_truth": 1}, {"key": "38453867", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6629233011687056, "res": {"Yes": 0.6629233011687056, "No": 0.33705198579750023}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6755819374326223, "res": {"Yes": 0.6755819374326223, "No": 0.3243864912080182}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5353948055186556, "res": {"Yes": 0.5353948055186556, "No": 0.4645818431576511}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5833641929103074, "res": {"Yes": 0.5833641929103074, "No": 0.41661510208840846}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5920448777270301, "res": {"Yes": 0.5920448777270301, "No": 0.40793107609016743}, "ground_truth": 1}, {"key": "38944856", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.41689357732784005, "res": {"No": 0.583092041178989, "Yes": 0.41689357732784005}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.2600519656637616, "res": {"No": 0.7399365793779433, "Yes": 0.2600519656637616}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.40044189666086294, "res": {"No": 0.5995383119806248, "Yes": 0.40044189666086294}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.36238644823773153, "res": {"No": 0.6375930639100368, "Yes": 0.36238644823773153}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.2782048684014926, "res": {"No": 0.721773688540647, "Yes": 0.2782048684014926}, "ground_truth": 1}, {"key": "35778898", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4134982899818906, "res": {"No": 0.5864767814457719, "Yes": 0.4134982899818906}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.46920176522888213, "res": {"No": 0.5307785436526571, "Yes": 0.46920176522888213}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3919906231552877, "res": {"No": 0.6079694043955473, "Yes": 0.3919906231552877}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7229649619723322, "res": {"Yes": 0.7229649619723322, "No": 0.27700855189616896}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6905695203691539, "res": {"Yes": 0.6905695203691539, "No": 0.3093977849648061}, "ground_truth": 1}, {"key": "32530125", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6101562421131063, "res": {"Yes": 0.6101562421131063, "No": 0.38980789427393897}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6060962967554039, "res": {"Yes": 0.6060962967554039, "No": 0.3938719194781346}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.33184413274150737, "res": {"No": 0.6681403384572024, "Yes": 0.33184413274150737}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7406369498279589, "res": {"Yes": 0.7406369498279589, "No": 0.2593392315407737}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7615361924016749, "res": {"Yes": 0.7615361924016749, "No": 0.23844714678109866}, "ground_truth": 1}, {"key": "35010363", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8076410210998681, "res": {"Yes": 0.8076410210998681, "No": 0.19233127559734736}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8703375970642335, "res": {"Yes": 0.8703375970642335, "No": 0.12964079089830008}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5865830606671766, "res": {"Yes": 0.5865830606671766, "No": 0.41338790067609354}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5396735657946518, "res": {"Yes": 0.5396735657946518, "No": 0.46029812573537654}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6847941341341964, "res": {"Yes": 0.6847941341341964, "No": 0.3151763990223196}, "ground_truth": 1}, {"key": "27514800", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6894549093802241, "res": {"Yes": 0.6894549093802241, "No": 0.31050986710424705}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7303900152821339, "res": {"Yes": 0.7303900152821339, "No": 0.2695830426782122}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3256461879600664, "res": {"No": 0.674333219022043, "Yes": 0.3256461879600664}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.856152452485561, "res": {"Yes": 0.856152452485561, "No": 0.14381972117755648}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7744527717525026, "res": {"Yes": 0.7744527717525026, "No": 0.2255200974644157}, "ground_truth": 1}, {"key": "25725840", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7379394675763071, "res": {"Yes": 0.7379394675763071, "No": 0.26204063285840584}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6984905844826161, "res": {"Yes": 0.6984905844826161, "No": 0.3014743925262202}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6459881752071254, "res": {"Yes": 0.6459881752071254, "No": 0.3539655807837091}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7087686006366751, "res": {"Yes": 0.7087686006366751, "No": 0.291197805134749}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.521023412822239, "res": {"Yes": 0.521023412822239, "No": 0.4789467101771412}, "ground_truth": 1}, {"key": "38327225", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6706150517523932, "res": {"Yes": 0.6706150517523932, "No": 0.32935486252485635}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6989046466514353, "res": {"Yes": 0.6989046466514353, "No": 0.3010644853908094}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4594827402113138, "res": {"No": 0.5404991578491596, "Yes": 0.4594827402113138}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5588986098533831, "res": {"Yes": 0.5588986098533831, "No": 0.44107735974345125}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5767664041154132, "res": {"Yes": 0.5767664041154132, "No": 0.4232077439698327}, "ground_truth": 1}, {"key": "11991724", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6404306104808253, "res": {"Yes": 0.6404306104808253, "No": 0.35953282450310803}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6043807190914449, "res": {"Yes": 0.6043807190914449, "No": 0.39558991993722864}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4052539140718657, "res": {"No": 0.5947327702225731, "Yes": 0.4052539140718657}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.725390578662703, "res": {"Yes": 0.725390578662703, "No": 0.27458827088951643}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.721847241026945, "res": {"Yes": 0.721847241026945, "No": 0.27813290611076075}, "ground_truth": 1}, {"key": "32217545", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6333404916210726, "res": {"Yes": 0.6333404916210726, "No": 0.36663748441139427}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6342532350021166, "res": {"Yes": 0.6342532350021166, "No": 0.36572810652449445}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5038434874058375, "res": {"Yes": 0.5038434874058375, "No": 0.49613808193639375}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8416722771855284, "res": {"Yes": 0.8416722771855284, "No": 0.15830608075145194}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6444701194832523, "res": {"Yes": 0.6444701194832523, "No": 0.35550722729562245}, "ground_truth": 1}, {"key": "12731847", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6937613040001286, "res": {"Yes": 0.6937613040001286, "No": 0.30621907555542605}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5343332505334171, "res": {"Yes": 0.5343332505334171, "No": 0.46564590230476793}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.29326612668569874, "res": {"No": 0.7067204601695143, "Yes": 0.29326612668569874}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5934526791239796, "res": {"Yes": 0.5934526791239796, "No": 0.40652071170029747}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5557441958539086, "res": {"Yes": 0.5557441958539086, "No": 0.44423552299351193}, "ground_truth": 1}, {"key": "36827234", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6530215818144604, "res": {"Yes": 0.6530215818144604, "No": 0.3469561069415571}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5302464926927768, "res": {"Yes": 0.5302464926927768, "No": 0.4697365139945401}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5802524392760866, "res": {"Yes": 0.5802524392760866, "No": 0.41972320108755223}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6098477885006186, "res": {"Yes": 0.6098477885006186, "No": 0.390134354682019}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.46269349590382497, "res": {"No": 0.5372859128488818, "Yes": 0.46269349590382497}, "ground_truth": 1}, {"key": "29111539", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4260189841386278, "res": {"No": 0.5739626812615112, "Yes": 0.4260189841386278}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5537397544034051, "res": {"Yes": 0.5537397544034051, "No": 0.44623763274902306}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5133407624716116, "res": {"Yes": 0.5133407624716116, "No": 0.48664647185364296}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6091022787324527, "res": {"Yes": 0.6091022787324527, "No": 0.3908774637726798}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.646795699621673, "res": {"Yes": 0.646795699621673, "No": 0.35318192024387673}, "ground_truth": 1}, {"key": "37763052", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.36613260589906255, "res": {"No": 0.6338463652593344, "Yes": 0.36613260589906255}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7301172363459192, "res": {"Yes": 0.7301172363459192, "No": 0.26986247543160025}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3532436265152292, "res": {"No": 0.6467421730245335, "Yes": 0.3532436265152292}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5566469232967536, "res": {"Yes": 0.5566469232967536, "No": 0.4433322899204995}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.733076307142598, "res": {"Yes": 0.733076307142598, "No": 0.26690806652627064}, "ground_truth": 1}, {"key": "30682335", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7456066624211457, "res": {"Yes": 0.7456066624211457, "No": 0.25437566717187987}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6104895760648484, "res": {"Yes": 0.6104895760648484, "No": 0.389487853114394}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.40189231475157466, "res": {"No": 0.598079285124338, "Yes": 0.40189231475157466}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6635271544323986, "res": {"Yes": 0.6635271544323986, "No": 0.3364452659623763}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.773523691870361, "res": {"Yes": 0.773523691870361, "No": 0.2264574297153816}, "ground_truth": 1}, {"key": "12261276", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7227846191705157, "res": {"Yes": 0.7227846191705157, "No": 0.2771804058864688}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6675301307674383, "res": {"Yes": 0.6675301307674383, "No": 0.3324478411211494}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.35051148695210316, "res": {"No": 0.6494693981459695, "Yes": 0.35051148695210316}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7260103340717777, "res": {"Yes": 0.7260103340717777, "No": 0.2739619365348648}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7134611310523126, "res": {"Yes": 0.7134611310523126, "No": 0.286515770204048}, "ground_truth": 1}, {"key": "36912979", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6293382930941384, "res": {"Yes": 0.6293382930941384, "No": 0.37063704892927296}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7591997431523727, "res": {"Yes": 0.7591997431523727, "No": 0.24077333662013567}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3966900237003621, "res": {"No": 0.6032831039365201, "Yes": 0.3966900237003621}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5372712451436761, "res": {"Yes": 0.5372712451436761, "No": 0.46269851152850516}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4096648879323604, "res": {"No": 0.5903023592776764, "Yes": 0.4096648879323604}, "ground_truth": 1}, {"key": "30205259", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.43068560922775784, "res": {"No": 0.5692808394066355, "Yes": 0.43068560922775784}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4143427289203417, "res": {"No": 0.5856413133910336, "Yes": 0.4143427289203417}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5518651809197994, "res": {"Yes": 0.5518651809197994, "No": 0.4481175914921508}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.1093760537571153, "res": {"No": 0.8906115120541958, "Yes": 0.1093760537571153}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.45364600942476413, "res": {"No": 0.5463338736061397, "Yes": 0.45364600942476413}, "ground_truth": 1}, {"key": "39458032", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.38379264086235115, "res": {"No": 0.6161832967818083, "Yes": 0.38379264086235115}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4578197185407186, "res": {"No": 0.5421542087614548, "Yes": 0.4578197185407186}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5328299440713911, "res": {"Yes": 0.5328299440713911, "No": 0.4671224593964764}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6113382025211432, "res": {"Yes": 0.6113382025211432, "No": 0.38862725815223664}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7156247081964751, "res": {"Yes": 0.7156247081964751, "No": 0.28433948073153964}, "ground_truth": 1}, {"key": "35116452", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7362125214234808, "res": {"Yes": 0.7362125214234808, "No": 0.26375028859326116}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.45237269158070187, "res": {"No": 0.5476007313574394, "Yes": 0.45237269158070187}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6601470802005874, "res": {"Yes": 0.6601470802005874, "No": 0.3398372678226539}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4095659002767028, "res": {"No": 0.5904130513470982, "Yes": 0.4095659002767028}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5518649932856698, "res": {"Yes": 0.5518649932856698, "No": 0.4481054476699709}, "ground_truth": 1}, {"key": "40107476", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5930608330508295, "res": {"Yes": 0.5930608330508295, "No": 0.40691145601348655}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.49361688456335573, "res": {"No": 0.506362734459496, "Yes": 0.49361688456335573}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3344345780024333, "res": {"No": 0.6655492096525957, "Yes": 0.3344345780024333}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5010158007356931, "res": {"Yes": 0.5010158007356931, "No": 0.49895402088052476}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3328359343675584, "res": {"No": 0.6671414944212417, "Yes": 0.3328359343675584}, "ground_truth": 1}, {"key": "39501049", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4342763484234279, "res": {"No": 0.5657002696313677, "Yes": 0.4342763484234279}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3922856521906307, "res": {"No": 0.6076951504766209, "Yes": 0.3922856521906307}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3075524614333023, "res": {"No": 0.6924341054728266, "Yes": 0.3075524614333023}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.38577496953336987, "res": {"No": 0.6142108658932137, "Yes": 0.38577496953336987}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7026814214085091, "res": {"Yes": 0.7026814214085091, "No": 0.29730203620815765}, "ground_truth": 1}, {"key": "39642178", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.34627531923833266, "res": {"No": 0.6537085951416952, "Yes": 0.34627531923833266}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.46383176867970743, "res": {"No": 0.5361508612270056, "Yes": 0.46383176867970743}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.8670215211158827, "res": {"Yes": 0.8670215211158827, "No": 0.13296257251834617}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8836808861806045, "res": {"Yes": 0.8836808861806045, "No": 0.1163039100086352}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8779879586172558, "res": {"Yes": 0.8779879586172558, "No": 0.12199441670612622}, "ground_truth": 1}, {"key": "38024796", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8941313997705063, "res": {"Yes": 0.8941313997705063, "No": 0.10585047435738656}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8712830705831998, "res": {"Yes": 0.8712830705831998, "No": 0.12869823223785393}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.65413332987033, "res": {"Yes": 0.65413332987033, "No": 0.34584796776907845}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6022151773984148, "res": {"Yes": 0.6022151773984148, "No": 0.39776215612748217}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6149093010617102, "res": {"Yes": 0.6149093010617102, "No": 0.3850669244733858}, "ground_truth": 1}, {"key": "36652079", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4221390824415734, "res": {"No": 0.5778415400840714, "Yes": 0.4221390824415734}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.37246982543025964, "res": {"No": 0.627511802116051, "Yes": 0.37246982543025964}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6547139672144088, "res": {"Yes": 0.6547139672144088, "No": 0.345265428425387}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6466087380115153, "res": {"Yes": 0.6466087380115153, "No": 0.3533769304817253}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7280921784870806, "res": {"Yes": 0.7280921784870806, "No": 0.2718866030948086}, "ground_truth": 1}, {"key": "32193402", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7916797856273896, "res": {"Yes": 0.7916797856273896, "No": 0.20830502648862453}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8387523155371721, "res": {"Yes": 0.8387523155371721, "No": 0.16123360546661872}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5077375290625172, "res": {"Yes": 0.5077375290625172, "No": 0.4922475197863619}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7672629554956677, "res": {"Yes": 0.7672629554956677, "No": 0.23271519782468394}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7802544145353197, "res": {"Yes": 0.7802544145353197, "No": 0.21972100423425062}, "ground_truth": 1}, {"key": "32589706", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7766022767495745, "res": {"Yes": 0.7766022767495745, "No": 0.22337325891091644}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7644848658119554, "res": {"Yes": 0.7644848658119554, "No": 0.2354962239115679}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4875433643438837, "res": {"No": 0.5124362325518453, "Yes": 0.4875433643438837}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5601546010783398, "res": {"Yes": 0.5601546010783398, "No": 0.43982638917055583}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6193857610514827, "res": {"Yes": 0.6193857610514827, "No": 0.3805923059138771}, "ground_truth": 1}, {"key": "38590589", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7355872788289486, "res": {"Yes": 0.7355872788289486, "No": 0.2643927743123536}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6745158464401454, "res": {"Yes": 0.6745158464401454, "No": 0.3254586372203604}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.30380443211598673, "res": {"No": 0.6961412248247838, "Yes": 0.30380443211598673}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7976486872567321, "res": {"Yes": 0.7976486872567321, "No": 0.20229244116296644}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5996820745198698, "res": {"Yes": 0.5996820745198698, "No": 0.40023933632345776}, "ground_truth": 1}, {"key": "37045414", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5397301967129998, "res": {"Yes": 0.5397301967129998, "No": 0.46022702897519385}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3577945285311453, "res": {"No": 0.6421540633602267, "Yes": 0.3577945285311453}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.19340052139993602, "res": {"No": 0.8065875192060391, "Yes": 0.19340052139993602}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.07873076382529823, "res": {"No": 0.9212571631875003, "Yes": 0.07873076382529823}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.2566523586181333, "res": {"No": 0.7433326667093868, "Yes": 0.2566523586181333}, "ground_truth": 1}, {"key": "33310095", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.20821797318296068, "res": {"No": 0.7917717049863164, "Yes": 0.20821797318296068}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.25460083836323866, "res": {"No": 0.7453832972169634, "Yes": 0.25460083836323866}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.33180603922167856, "res": {"No": 0.668179626264154, "Yes": 0.33180603922167856}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7131359025992002, "res": {"Yes": 0.7131359025992002, "No": 0.28684324416949886}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7464124869651856, "res": {"Yes": 0.7464124869651856, "No": 0.2535625096392981}, "ground_truth": 1}, {"key": "37934604", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6747034621298893, "res": {"Yes": 0.6747034621298893, "No": 0.32527421953369345}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6108391997373032, "res": {"Yes": 0.6108391997373032, "No": 0.38914045643771394}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3757502819437625, "res": {"No": 0.624197246750667, "Yes": 0.3757502819437625}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.42238113882076317, "res": {"No": 0.5775611469654827, "Yes": 0.42238113882076317}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4391962794589285, "res": {"No": 0.5607482648076899, "Yes": 0.4391962794589285}, "ground_truth": 1}, {"key": "39012181", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.38145549232672843, "res": {"No": 0.6184776274966652, "Yes": 0.38145549232672843}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4111270656916171, "res": {"No": 0.5888247369305416, "Yes": 0.4111270656916171}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4047037746951018, "res": {"No": 0.5952749793660355, "Yes": 0.4047037746951018}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.57106812397871, "res": {"Yes": 0.57106812397871, "No": 0.4289087013795589}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6209351939889489, "res": {"Yes": 0.6209351939889489, "No": 0.3790426679095918}, "ground_truth": 1}, {"key": "40221674", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5972580884778664, "res": {"Yes": 0.5972580884778664, "No": 0.40271844856249966}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4347020174419002, "res": {"No": 0.5652727901094694, "Yes": 0.4347020174419002}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5212054380891998, "res": {"Yes": 0.5212054380891998, "No": 0.4787742294263881}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6639994219920385, "res": {"Yes": 0.6639994219920385, "No": 0.3359739338014951}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6771632078588128, "res": {"Yes": 0.6771632078588128, "No": 0.3228105694799068}, "ground_truth": 1}, {"key": "36884862", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6575273623859559, "res": {"Yes": 0.6575273623859559, "No": 0.3424538756444054}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6363807062472472, "res": {"Yes": 0.6363807062472472, "No": 0.36359677003876295}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3618196484518867, "res": {"No": 0.6381579664293506, "Yes": 0.3618196484518867}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.607926288734287, "res": {"Yes": 0.607926288734287, "No": 0.3920518019855973}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.677752996070551, "res": {"Yes": 0.677752996070551, "No": 0.3222245874527912}, "ground_truth": 1}, {"key": "39054429", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6441165828444723, "res": {"Yes": 0.6441165828444723, "No": 0.35586084833689174}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8109272361813338, "res": {"Yes": 0.8109272361813338, "No": 0.1890506330624341}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5150550298238462, "res": {"Yes": 0.5150550298238462, "No": 0.4849229823174834}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8203005840320149, "res": {"Yes": 0.8203005840320149, "No": 0.17967103203420973}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6409273032240375, "res": {"Yes": 0.6409273032240375, "No": 0.35904038635879326}, "ground_truth": 1}, {"key": "36753964", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7566111423662207, "res": {"Yes": 0.7566111423662207, "No": 0.24335714065145814}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7691397472837416, "res": {"Yes": 0.7691397472837416, "No": 0.23083193208432362}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.501998122167297, "res": {"Yes": 0.501998122167297, "No": 0.4979651919913471}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6651700345214225, "res": {"Yes": 0.6651700345214225, "No": 0.33480232364287377}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6279934264531576, "res": {"Yes": 0.6279934264531576, "No": 0.3719701945858442}, "ground_truth": 1}, {"key": "37612459", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.572276793457761, "res": {"Yes": 0.572276793457761, "No": 0.4276853574062197}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6530133080834329, "res": {"Yes": 0.6530133080834329, "No": 0.3469536782573089}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.576787854456849, "res": {"Yes": 0.576787854456849, "No": 0.42318798062966695}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4603866956149172, "res": {"No": 0.539597223575493, "Yes": 0.4603866956149172}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.41722601567402917, "res": {"No": 0.5827517139088895, "Yes": 0.41722601567402917}, "ground_truth": 1}, {"key": "36805789", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3558317756932163, "res": {"No": 0.6441388696637984, "Yes": 0.3558317756932163}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4036360796194466, "res": {"No": 0.5963420721504273, "Yes": 0.4036360796194466}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3570632292999926, "res": {"No": 0.6429216325567398, "Yes": 0.3570632292999926}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6377120690081697, "res": {"Yes": 0.6377120690081697, "No": 0.362270213310216}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5411656796376589, "res": {"Yes": 0.5411656796376589, "No": 0.458805915680049}, "ground_truth": 1}, {"key": "12757394", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6736038234008388, "res": {"Yes": 0.6736038234008388, "No": 0.3263647363082606}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5379069441740351, "res": {"Yes": 0.5379069441740351, "No": 0.462072303067114}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.20291352011374178, "res": {"No": 0.7970666241674865, "Yes": 0.20291352011374178}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.2586955994961396, "res": {"No": 0.7412830595014865, "Yes": 0.2586955994961396}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.29498608300776963, "res": {"No": 0.7049916501492044, "Yes": 0.29498608300776963}, "ground_truth": 1}, {"key": "32192542", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.39603356944293455, "res": {"No": 0.6039435775880849, "Yes": 0.39603356944293455}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.45808249087739095, "res": {"No": 0.5418945628248933, "Yes": 0.45808249087739095}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.550447745067327, "res": {"Yes": 0.550447745067327, "No": 0.44952720684251246}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5797948412493087, "res": {"Yes": 0.5797948412493087, "No": 0.4201864784215933}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8451734300682855, "res": {"Yes": 0.8451734300682855, "No": 0.1548043217398703}, "ground_truth": 1}, {"key": "34856060", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8507426883465742, "res": {"Yes": 0.8507426883465742, "No": 0.14924045229178418}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.46484205395932826, "res": {"No": 0.5351370803247772, "Yes": 0.46484205395932826}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.544957919078471, "res": {"Yes": 0.544957919078471, "No": 0.45502204984845374}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.306513187018874, "res": {"No": 0.6934574614787846, "Yes": 0.306513187018874}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.31389702271475417, "res": {"No": 0.6860824492961195, "Yes": 0.31389702271475417}, "ground_truth": 1}, {"key": "36083416", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4515835379927632, "res": {"No": 0.5483936283386327, "Yes": 0.4515835379927632}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5268547105535063, "res": {"Yes": 0.5268547105535063, "No": 0.4731188138319121}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.48514968829647864, "res": {"No": 0.5148321262007126, "Yes": 0.48514968829647864}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.32615609278027013, "res": {"No": 0.6738270724867812, "Yes": 0.32615609278027013}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7361373358780829, "res": {"Yes": 0.7361373358780829, "No": 0.2638506646734092}, "ground_truth": 1}, {"key": "33839050", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.49387364690810986, "res": {"No": 0.5061046059166598, "Yes": 0.49387364690810986}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.627778833812551, "res": {"Yes": 0.627778833812551, "No": 0.37219716190169844}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.06329383803430508, "res": {"No": 0.9366956104158831, "Yes": 0.06329383803430508}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6988950228007113, "res": {"Yes": 0.6988950228007113, "No": 0.3010879392277364}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8205988339069351, "res": {"Yes": 0.8205988339069351, "No": 0.17939318819605007}, "ground_truth": 1}, {"key": "18464690", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.65216794882745, "res": {"Yes": 0.65216794882745, "No": 0.34781626944266314}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7590360393797556, "res": {"Yes": 0.7590360393797556, "No": 0.24095155073408203}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.49906276977968866, "res": {"No": 0.5009242935471366, "Yes": 0.49906276977968866}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7384645875664767, "res": {"Yes": 0.7384645875664767, "No": 0.2615108512924154}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7524480660174285, "res": {"Yes": 0.7524480660174285, "No": 0.24752173070484562}, "ground_truth": 1}, {"key": "39212665", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6480008311446839, "res": {"Yes": 0.6480008311446839, "No": 0.351974094944456}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7116051827372026, "res": {"Yes": 0.7116051827372026, "No": 0.2883679529186472}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5587920045229071, "res": {"Yes": 0.5587920045229071, "No": 0.44118759874944125}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6519610422441076, "res": {"Yes": 0.6519610422441076, "No": 0.3480170869437409}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.45043024634690043, "res": {"No": 0.5495509823034929, "Yes": 0.45043024634690043}, "ground_truth": 1}, {"key": "40094011", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6658307965197025, "res": {"Yes": 0.6658307965197025, "No": 0.33413856726170965}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5648664768070377, "res": {"Yes": 0.5648664768070377, "No": 0.43510599974643516}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5064726270957935, "res": {"Yes": 0.5064726270957935, "No": 0.4935083994950744}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.47997133289457505, "res": {"No": 0.5200012570529847, "Yes": 0.47997133289457505}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5655986789860549, "res": {"Yes": 0.5655986789860549, "No": 0.43437481003181716}, "ground_truth": 1}, {"key": "36036272", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6385650176209483, "res": {"Yes": 0.6385650176209483, "No": 0.36141358919327765}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.564346891896365, "res": {"Yes": 0.564346891896365, "No": 0.43562295146403046}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4891531247386763, "res": {"No": 0.5108340841770906, "Yes": 0.4891531247386763}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5395223326784092, "res": {"Yes": 0.5395223326784092, "No": 0.4604606396557805}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6520910823215381, "res": {"Yes": 0.6520910823215381, "No": 0.34789067530011963}, "ground_truth": 1}, {"key": "30681904", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.693653404758446, "res": {"Yes": 0.693653404758446, "No": 0.3063262403573516}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5983122524635502, "res": {"Yes": 0.5983122524635502, "No": 0.40167022614217723}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.186178441920798, "res": {"No": 0.8138007351990908, "Yes": 0.186178441920798}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7853625191231042, "res": {"Yes": 0.7853625191231042, "No": 0.21461078366030728}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8211720499788973, "res": {"Yes": 0.8211720499788973, "No": 0.1788029173679991}, "ground_truth": 1}, {"key": "27834240", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7825982463564434, "res": {"Yes": 0.7825982463564434, "No": 0.2173673716424885}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7518843926715377, "res": {"Yes": 0.7518843926715377, "No": 0.2480941668119295}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.44271759291289947, "res": {"No": 0.5572508730532635, "Yes": 0.44271759291289947}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6210184980327164, "res": {"Yes": 0.6210184980327164, "No": 0.3789445843596956}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6401367842972499, "res": {"Yes": 0.6401367842972499, "No": 0.35983769371047475}, "ground_truth": 1}, {"key": "35025075", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.689010781534636, "res": {"Yes": 0.689010781534636, "No": 0.3109585983317322}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6026576729571781, "res": {"Yes": 0.6026576729571781, "No": 0.39731411082157686}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.42263089902151507, "res": {"No": 0.5773474080416477, "Yes": 0.42263089902151507}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5955794391543129, "res": {"Yes": 0.5955794391543129, "No": 0.4044006032988559}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8035572705428923, "res": {"Yes": 0.8035572705428923, "No": 0.19642313395569924}, "ground_truth": 1}, {"key": "33316985", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7698431932521268, "res": {"Yes": 0.7698431932521268, "No": 0.23013221209908544}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.43649666240389273, "res": {"No": 0.5634719076908192, "Yes": 0.43649666240389273}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.21147690133629787, "res": {"No": 0.7885079343834963, "Yes": 0.21147690133629787}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7624768969816916, "res": {"Yes": 0.7624768969816916, "No": 0.23750044068342613}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6497892756249889, "res": {"Yes": 0.6497892756249889, "No": 0.35018951486442884}, "ground_truth": 1}, {"key": "17037056", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7884975576873586, "res": {"Yes": 0.7884975576873586, "No": 0.2114821883249184}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.46920451006723735, "res": {"No": 0.5307785967305141, "Yes": 0.46920451006723735}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3919032973729021, "res": {"No": 0.6080832573256683, "Yes": 0.3919032973729021}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5909544424974396, "res": {"Yes": 0.5909544424974396, "No": 0.4090229712872496}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6661781578069376, "res": {"Yes": 0.6661781578069376, "No": 0.3337955163465323}, "ground_truth": 1}, {"key": "34050457", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5982622954762028, "res": {"Yes": 0.5982622954762028, "No": 0.4017117690251103}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4841582320359277, "res": {"No": 0.5158184069273262, "Yes": 0.4841582320359277}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3582067304103791, "res": {"No": 0.6417716525166894, "Yes": 0.3582067304103791}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5705501546769524, "res": {"Yes": 0.5705501546769524, "No": 0.4294197071371954}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6694820869978267, "res": {"Yes": 0.6694820869978267, "No": 0.33049227289800726}, "ground_truth": 1}, {"key": "34713745", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7147623279568666, "res": {"Yes": 0.7147623279568666, "No": 0.28520193664063265}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6174556221661289, "res": {"Yes": 0.6174556221661289, "No": 0.3825118866458886}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.1828698465896159, "res": {"No": 0.817093498027364, "Yes": 0.1828698465896159}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.2453490471719314, "res": {"No": 0.7546133727261158, "Yes": 0.2453490471719314}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.45683662798491376, "res": {"No": 0.5431302047714358, "Yes": 0.45683662798491376}, "ground_truth": 1}, {"key": "40856210", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.41206879311131206, "res": {"No": 0.5878883088863598, "Yes": 0.41206879311131206}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.46864883202707125, "res": {"No": 0.5313060279117546, "Yes": 0.46864883202707125}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.33424527474117877, "res": {"No": 0.6657411817257018, "Yes": 0.33424527474117877}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6167251415119266, "res": {"Yes": 0.6167251415119266, "No": 0.38325048336678413}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5315619452573886, "res": {"Yes": 0.5315619452573886, "No": 0.46840976495770237}, "ground_truth": 1}, {"key": "40848302", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.548892789382054, "res": {"Yes": 0.548892789382054, "No": 0.4510877007312018}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.747229770585896, "res": {"Yes": 0.747229770585896, "No": 0.25275551533853846}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.17568418486356233, "res": {"No": 0.8242876831235957, "Yes": 0.17568418486356233}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5130992924531451, "res": {"Yes": 0.5130992924531451, "No": 0.4868500835227137}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6201872192459433, "res": {"Yes": 0.6201872192459433, "No": 0.3797533370701625}, "ground_truth": 1}, {"key": "40636168", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.57040548150306, "res": {"Yes": 0.57040548150306, "No": 0.4295467053203519}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3624449058863148, "res": {"No": 0.6375013654943043, "Yes": 0.3624449058863148}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.35836878396019134, "res": {"No": 0.6416090802632342, "Yes": 0.35836878396019134}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.719840153966072, "res": {"Yes": 0.719840153966072, "No": 0.280121539598324}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7721523221003227, "res": {"Yes": 0.7721523221003227, "No": 0.22782547583577975}, "ground_truth": 1}, {"key": "34423311", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7355216232386929, "res": {"Yes": 0.7355216232386929, "No": 0.2644523751604469}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5369756661135029, "res": {"Yes": 0.5369756661135029, "No": 0.4629990855277062}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.36756963326716036, "res": {"No": 0.63241743781466, "Yes": 0.36756963326716036}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.35960178951238064, "res": {"No": 0.6403775850215617, "Yes": 0.35960178951238064}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3164381421320842, "res": {"No": 0.683551348374887, "Yes": 0.3164381421320842}, "ground_truth": 1}, {"key": "34833945", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.21082543715060909, "res": {"No": 0.7891615075774825, "Yes": 0.21082543715060909}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.2570132086197573, "res": {"No": 0.7429706998261735, "Yes": 0.2570132086197573}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.17645268715295948, "res": {"No": 0.82352150134231, "Yes": 0.17645268715295948}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6114625307852737, "res": {"Yes": 0.6114625307852737, "No": 0.3885120861022613}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6168929752556773, "res": {"Yes": 0.6168929752556773, "No": 0.38306969311410294}, "ground_truth": 1}, {"key": "21272328", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6369194395067689, "res": {"Yes": 0.6369194395067689, "No": 0.3630553416505388}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.45297241019530143, "res": {"No": 0.5470011085295285, "Yes": 0.45297241019530143}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2717313458128219, "res": {"No": 0.728237316284049, "Yes": 0.2717313458128219}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.46694682168127893, "res": {"No": 0.5330198571869695, "Yes": 0.46694682168127893}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6205981425270319, "res": {"Yes": 0.6205981425270319, "No": 0.37937777596090805}, "ground_truth": 1}, {"key": "38648957", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5928231818974151, "res": {"Yes": 0.5928231818974151, "No": 0.4071333931254326}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4335062783225914, "res": {"No": 0.5664652737726197, "Yes": 0.4335062783225914}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4741550030923811, "res": {"No": 0.5258287077213523, "Yes": 0.4741550030923811}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6816014746207235, "res": {"Yes": 0.6816014746207235, "No": 0.3183701752807288}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6854940567268951, "res": {"Yes": 0.6854940567268951, "No": 0.3144610053113616}, "ground_truth": 1}, {"key": "24942981", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7249963055018235, "res": {"Yes": 0.7249963055018235, "No": 0.27495929787419243}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6447084563697477, "res": {"Yes": 0.6447084563697477, "No": 0.35525085686578367}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.011763207818801852, "res": {"No": 0.9882261773402674, "Yes": 0.011763207818801852}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4175486811215122, "res": {"No": 0.5824120453794039, "Yes": 0.4175486811215122}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.46349721621634105, "res": {"No": 0.5364809636606935, "Yes": 0.46349721621634105}, "ground_truth": 1}, {"key": "35882366", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.34887778651958956, "res": {"No": 0.6510962293210901, "Yes": 0.34887778651958956}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.33833850181180203, "res": {"No": 0.6616265010991397, "Yes": 0.33833850181180203}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.500337454104034, "res": {"Yes": 0.500337454104034, "No": 0.499646040626371}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5963559253376676, "res": {"Yes": 0.5963559253376676, "No": 0.4036308323845186}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6677438480422917, "res": {"Yes": 0.6677438480422917, "No": 0.33224677100711364}, "ground_truth": 1}, {"key": "40559523", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5478593640038482, "res": {"Yes": 0.5478593640038482, "No": 0.4521230281560022}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6351371177088135, "res": {"Yes": 0.6351371177088135, "No": 0.364846121216538}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.37020963970508514, "res": {"No": 0.6297730138466993, "Yes": 0.37020963970508514}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8023113094790435, "res": {"Yes": 0.8023113094790435, "No": 0.19767599055687762}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7786536192053717, "res": {"Yes": 0.7786536192053717, "No": 0.22132913206234464}, "ground_truth": 1}, {"key": "24632722", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7405002927006649, "res": {"Yes": 0.7405002927006649, "No": 0.25948481356400926}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7635363238599887, "res": {"Yes": 0.7635363238599887, "No": 0.23644815803619762}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6687825560586426, "res": {"Yes": 0.6687825560586426, "No": 0.3312014759864948}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7510475602466329, "res": {"Yes": 0.7510475602466329, "No": 0.24893036008704456}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7322808234488273, "res": {"Yes": 0.7322808234488273, "No": 0.26769976668772744}, "ground_truth": 1}, {"key": "36002759", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7576281355971736, "res": {"Yes": 0.7576281355971736, "No": 0.242353033438988}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7673889657646392, "res": {"Yes": 0.7673889657646392, "No": 0.2325910076014046}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4247556570408545, "res": {"No": 0.5752317188838351, "Yes": 0.4247556570408545}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.48783263159451845, "res": {"No": 0.5121499119612144, "Yes": 0.48783263159451845}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.42515985132869805, "res": {"No": 0.5748244725029251, "Yes": 0.42515985132869805}, "ground_truth": 1}, {"key": "29508534", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6090460490056842, "res": {"Yes": 0.6090460490056842, "No": 0.39094128363688907}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5285689598341935, "res": {"Yes": 0.5285689598341935, "No": 0.4714137596503328}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5936049192601377, "res": {"Yes": 0.5936049192601377, "No": 0.40636836409594085}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8120545023112578, "res": {"Yes": 0.8120545023112578, "No": 0.18792045826818646}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8544000433831921, "res": {"Yes": 0.8544000433831921, "No": 0.14558046808296554}, "ground_truth": 1}, {"key": "15631612", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8983266087110916, "res": {"Yes": 0.8983266087110916, "No": 0.1016506850122841}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6093453712198693, "res": {"Yes": 0.6093453712198693, "No": 0.3906286947407042}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.35933973533817815, "res": {"No": 0.6406399886576841, "Yes": 0.35933973533817815}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7323428209676585, "res": {"Yes": 0.7323428209676585, "No": 0.26763306421734184}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7911213971352938, "res": {"Yes": 0.7911213971352938, "No": 0.2088568478941992}, "ground_truth": 1}, {"key": "40731892", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6711849275873542, "res": {"Yes": 0.6711849275873542, "No": 0.3287888919427164}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7310042538712312, "res": {"Yes": 0.7310042538712312, "No": 0.2689763288748523}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.571660531601622, "res": {"Yes": 0.571660531601622, "No": 0.4283164874520706}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5670794282320712, "res": {"Yes": 0.5670794282320712, "No": 0.4328949457203617}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6619705105727123, "res": {"Yes": 0.6619705105727123, "No": 0.3380027998342982}, "ground_truth": 1}, {"key": "35971910", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5814138321690089, "res": {"Yes": 0.5814138321690089, "No": 0.41856267048550855}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6625543147195262, "res": {"Yes": 0.6625543147195262, "No": 0.3374244653797966}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3008364251467205, "res": {"No": 0.6991481804611909, "Yes": 0.3008364251467205}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.47603697937768963, "res": {"No": 0.5239374091408943, "Yes": 0.47603697937768963}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4463807016144297, "res": {"No": 0.5536004288622818, "Yes": 0.4463807016144297}, "ground_truth": 1}, {"key": "34428424", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4827082572892092, "res": {"No": 0.517269170859148, "Yes": 0.4827082572892092}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.0791910651728335, "res": {"No": 0.9207958302352078, "Yes": 0.0791910651728335}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.44970427900826004, "res": {"No": 0.5502781782401828, "Yes": 0.44970427900826004}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.36787506343213994, "res": {"No": 0.6321020034465801, "Yes": 0.36787506343213994}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4816771175516656, "res": {"No": 0.5183010644786237, "Yes": 0.4816771175516656}, "ground_truth": 1}, {"key": "36971005", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5468144215657422, "res": {"Yes": 0.5468144215657422, "No": 0.45316168348203606}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.16658348230383366, "res": {"No": 0.8333957496656579, "Yes": 0.16658348230383366}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6009301945668274, "res": {"Yes": 0.6009301945668274, "No": 0.399016009035973}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7565060488118764, "res": {"Yes": 0.7565060488118764, "No": 0.24345705926458783}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.658327237402281, "res": {"Yes": 0.658327237402281, "No": 0.34163078537745706}, "ground_truth": 1}, {"key": "34649067", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7566805267892028, "res": {"Yes": 0.7566805267892028, "No": 0.24327830570983724}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8387765390538308, "res": {"Yes": 0.8387765390538308, "No": 0.16119028781681674}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.19179574525818352, "res": {"No": 0.808177432411267, "Yes": 0.19179574525818352}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5858334176730853, "res": {"Yes": 0.5858334176730853, "No": 0.41413251575864435}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6438198938029598, "res": {"Yes": 0.6438198938029598, "No": 0.3561375308931333}, "ground_truth": 1}, {"key": "37355154", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.46754820185323126, "res": {"No": 0.5324303117051843, "Yes": 0.46754820185323126}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5177435689152025, "res": {"Yes": 0.5177435689152025, "No": 0.4822137492779663}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.29079657827039357, "res": {"No": 0.7091906774727276, "Yes": 0.29079657827039357}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3867597421730257, "res": {"No": 0.613215484712391, "Yes": 0.3867597421730257}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.554086093987104, "res": {"Yes": 0.554086093987104, "No": 0.44588524423094317}, "ground_truth": 1}, {"key": "38674697", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5339606136243041, "res": {"Yes": 0.5339606136243041, "No": 0.4660210845801057}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5093159643053408, "res": {"Yes": 0.5093159643053408, "No": 0.490663707151598}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.28161274401138814, "res": {"No": 0.7183214271377452, "Yes": 0.28161274401138814}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3550782468969668, "res": {"No": 0.644867357900778, "Yes": 0.3550782468969668}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.693496296183989, "res": {"Yes": 0.693496296183989, "No": 0.30646371978260245}, "ground_truth": 1}, {"key": "40525767", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6940016784239104, "res": {"Yes": 0.6940016784239104, "No": 0.305956727631031}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.637591693086423, "res": {"Yes": 0.637591693086423, "No": 0.36236633634796434}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4198719311656995, "res": {"No": 0.5800939185593971, "Yes": 0.4198719311656995}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.45062375219538253, "res": {"No": 0.5493384351150263, "Yes": 0.45062375219538253}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3846750604088648, "res": {"No": 0.6152837718215297, "Yes": 0.3846750604088648}, "ground_truth": 1}, {"key": "27165110", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.41541527351695107, "res": {"No": 0.5845491866163736, "Yes": 0.41541527351695107}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3578066579712553, "res": {"No": 0.6421672469184763, "Yes": 0.3578066579712553}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7286698355820526, "res": {"Yes": 0.7286698355820526, "No": 0.27130476388459535}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7386307681787736, "res": {"Yes": 0.7386307681787736, "No": 0.26134032338784}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6832856557671833, "res": {"Yes": 0.6832856557671833, "No": 0.3166815766519602}, "ground_truth": 1}, {"key": "35497491", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6992569903673135, "res": {"Yes": 0.6992569903673135, "No": 0.30071569363810147}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6459855977194483, "res": {"Yes": 0.6459855977194483, "No": 0.35399453635248385}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6054884265769411, "res": {"Yes": 0.6054884265769411, "No": 0.39448384109660123}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6210772056861089, "res": {"Yes": 0.6210772056861089, "No": 0.378908851570218}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6443795906797594, "res": {"Yes": 0.6443795906797594, "No": 0.355580007073806}, "ground_truth": 1}, {"key": "40690716", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.702613095989127, "res": {"Yes": 0.702613095989127, "No": 0.2973695016938432}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4868467145317924, "res": {"No": 0.5131329272141326, "Yes": 0.4868467145317924}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.12750623673644798, "res": {"No": 0.8724644680786219, "Yes": 0.12750623673644798}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.38055972860681947, "res": {"No": 0.6194083504621036, "Yes": 0.38055972860681947}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5227143709262574, "res": {"Yes": 0.5227143709262574, "No": 0.4772476692962708}, "ground_truth": 1}, {"key": "34835193", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4203551625185408, "res": {"No": 0.5796018364861489, "Yes": 0.4203551625185408}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3597494363494155, "res": {"No": 0.6402239768649503, "Yes": 0.3597494363494155}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.09275220538884268, "res": {"No": 0.9072366207821592, "Yes": 0.09275220538884268}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7316291054306451, "res": {"Yes": 0.7316291054306451, "No": 0.26833679223446133}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.47861256509380196, "res": {"No": 0.5213625009480277, "Yes": 0.47861256509380196}, "ground_truth": 1}, {"key": "39471712", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5545036664724279, "res": {"Yes": 0.5545036664724279, "No": 0.4454712359163808}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.712600609850753, "res": {"Yes": 0.712600609850753, "No": 0.28737241245806444}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3140600089586651, "res": {"No": 0.6859164991641178, "Yes": 0.3140600089586651}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.41937477825812364, "res": {"No": 0.5805996094836987, "Yes": 0.41937477825812364}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5363029351743162, "res": {"Yes": 0.5363029351743162, "No": 0.4636705038612058}, "ground_truth": 1}, {"key": "39115192", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.518369821675047, "res": {"Yes": 0.518369821675047, "No": 0.4816068989634061}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6187932614799506, "res": {"Yes": 0.6187932614799506, "No": 0.3811693059452389}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3157708142160533, "res": {"No": 0.684211683799071, "Yes": 0.3157708142160533}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6729729118492381, "res": {"Yes": 0.6729729118492381, "No": 0.3270026186542422}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7112983620505954, "res": {"Yes": 0.7112983620505954, "No": 0.2886777110012867}, "ground_truth": 1}, {"key": "23520673", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5458431748739303, "res": {"Yes": 0.5458431748739303, "No": 0.4541350582720523}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7375145958359505, "res": {"Yes": 0.7375145958359505, "No": 0.26246382919177647}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6481205927639121, "res": {"Yes": 0.6481205927639121, "No": 0.35184716078236183}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6633018721341427, "res": {"Yes": 0.6633018721341427, "No": 0.336668605136611}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7840729848842545, "res": {"Yes": 0.7840729848842545, "No": 0.21590588151162107}, "ground_truth": 1}, {"key": "35764233", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.557360656715533, "res": {"Yes": 0.557360656715533, "No": 0.4426106010011858}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7997117569913643, "res": {"Yes": 0.7997117569913643, "No": 0.20026283504130607}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5268996531770921, "res": {"Yes": 0.5268996531770921, "No": 0.47307885117355436}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.30379577381305284, "res": {"No": 0.6961811357452385, "Yes": 0.30379577381305284}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6772275143302541, "res": {"Yes": 0.6772275143302541, "No": 0.32273655750212255}, "ground_truth": 1}, {"key": "35228910", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.695913213270135, "res": {"Yes": 0.695913213270135, "No": 0.3040364449675018}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6288785029508264, "res": {"Yes": 0.6288785029508264, "No": 0.3710825479171546}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5278005040032763, "res": {"Yes": 0.5278005040032763, "No": 0.47218156299491304}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.484892675578184, "res": {"No": 0.5150906110542679, "Yes": 0.484892675578184}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4775861101152099, "res": {"No": 0.5223901272660966, "Yes": 0.4775861101152099}, "ground_truth": 1}, {"key": "36795599", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5444497975681196, "res": {"Yes": 0.5444497975681196, "No": 0.4555343288130401}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.402355038415161, "res": {"No": 0.5976029552370322, "Yes": 0.402355038415161}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3824208022863845, "res": {"No": 0.6175641804064954, "Yes": 0.3824208022863845}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7412743939531712, "res": {"Yes": 0.7412743939531712, "No": 0.25870835350357846}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7507524115019851, "res": {"Yes": 0.7507524115019851, "No": 0.24922773552689814}, "ground_truth": 1}, {"key": "38641949", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.635091624466432, "res": {"Yes": 0.635091624466432, "No": 0.3648896134662736}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7729698770820577, "res": {"Yes": 0.7729698770820577, "No": 0.22701293062893724}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6331225523303056, "res": {"Yes": 0.6331225523303056, "No": 0.3668609813870064}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5711958690718403, "res": {"Yes": 0.5711958690718403, "No": 0.4287886666336891}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5662270346029121, "res": {"Yes": 0.5662270346029121, "No": 0.43375479197548344}, "ground_truth": 1}, {"key": "29968443", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4526445406487428, "res": {"No": 0.5473385974124433, "Yes": 0.4526445406487428}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5753994981735612, "res": {"Yes": 0.5753994981735612, "No": 0.4245798021365448}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6445093366831941, "res": {"Yes": 0.6445093366831941, "No": 0.3554725670306765}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7225908449100847, "res": {"Yes": 0.7225908449100847, "No": 0.2773900889805859}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5678629355684522, "res": {"Yes": 0.5678629355684522, "No": 0.4321227273483993}, "ground_truth": 1}, {"key": "21268042", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4708142341921784, "res": {"No": 0.5291629132391109, "Yes": 0.4708142341921784}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6936812346913096, "res": {"Yes": 0.6936812346913096, "No": 0.3062976308225884}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4659785387973281, "res": {"No": 0.53400456039119, "Yes": 0.4659785387973281}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6758872545899438, "res": {"Yes": 0.6758872545899438, "No": 0.32409204954682264}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7661926036891833, "res": {"Yes": 0.7661926036891833, "No": 0.2337727241321162}, "ground_truth": 1}, {"key": "26808572", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.699571530943314, "res": {"Yes": 0.699571530943314, "No": 0.3004065965837113}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7423781496410894, "res": {"Yes": 0.7423781496410894, "No": 0.25759216515124944}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4669547364969843, "res": {"No": 0.5330258270428012, "Yes": 0.4669547364969843}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6046615191462269, "res": {"Yes": 0.6046615191462269, "No": 0.39531350315662894}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6266641674161015, "res": {"Yes": 0.6266641674161015, "No": 0.3733085834085739}, "ground_truth": 1}, {"key": "37829390", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3940282388674993, "res": {"No": 0.6059483848834144, "Yes": 0.3940282388674993}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.32166913267290814, "res": {"No": 0.6783083234907878, "Yes": 0.32166913267290814}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5517541844025063, "res": {"Yes": 0.5517541844025063, "No": 0.4482206121231297}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6565071265032713, "res": {"Yes": 0.6565071265032713, "No": 0.34346770129291915}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5884345049376357, "res": {"Yes": 0.5884345049376357, "No": 0.41154243971629495}, "ground_truth": 1}, {"key": "35716045", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.40189520838665793, "res": {"No": 0.5980858939369522, "Yes": 0.40189520838665793}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5699022067375327, "res": {"Yes": 0.5699022067375327, "No": 0.430070728042819}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4333522592335518, "res": {"No": 0.5666291758836193, "Yes": 0.4333522592335518}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.37378332289653604, "res": {"No": 0.6261925545825153, "Yes": 0.37378332289653604}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.27901752095798266, "res": {"No": 0.7209636060622323, "Yes": 0.27901752095798266}, "ground_truth": 1}, {"key": "34367070", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.25923139478058455, "res": {"No": 0.7407442536752471, "Yes": 0.25923139478058455}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.308977011899221, "res": {"No": 0.6910049788211335, "Yes": 0.308977011899221}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4740169018554021, "res": {"No": 0.5259393379428274, "Yes": 0.4740169018554021}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.48685086735197913, "res": {"No": 0.5131177130483918, "Yes": 0.48685086735197913}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.500296263017092, "res": {"Yes": 0.500296263017092, "No": 0.4996582821043239}, "ground_truth": 1}, {"key": "35239748", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3754760092370391, "res": {"No": 0.6244868415592357, "Yes": 0.3754760092370391}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.18309526277021887, "res": {"No": 0.8168750936168625, "Yes": 0.18309526277021887}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6881086720232307, "res": {"Yes": 0.6881086720232307, "No": 0.31186508642362776}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6285369763408942, "res": {"Yes": 0.6285369763408942, "No": 0.37144454469666643}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7388740984530593, "res": {"Yes": 0.7388740984530593, "No": 0.26110198522318584}, "ground_truth": 1}, {"key": "40421370", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8046606606512634, "res": {"Yes": 0.8046606606512634, "No": 0.1953215703378371}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6375062678986546, "res": {"Yes": 0.6375062678986546, "No": 0.3624705316470209}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.10451224890964335, "res": {"No": 0.8954700616800269, "Yes": 0.10451224890964335}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7318376933520631, "res": {"Yes": 0.7318376933520631, "No": 0.2681293407911609}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6181918270074702, "res": {"Yes": 0.6181918270074702, "No": 0.38178499849095293}, "ground_truth": 1}, {"key": "37288396", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6347100046453164, "res": {"Yes": 0.6347100046453164, "No": 0.36526272127685183}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6967128730072493, "res": {"Yes": 0.6967128730072493, "No": 0.3032662337581587}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6292287348346339, "res": {"Yes": 0.6292287348346339, "No": 0.370752112526207}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5197934280930587, "res": {"Yes": 0.5197934280930587, "No": 0.48018232665786537}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4816712748436658, "res": {"No": 0.5183125449743479, "Yes": 0.4816712748436658}, "ground_truth": 1}, {"key": "38903688", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6116431834979597, "res": {"Yes": 0.6116431834979597, "No": 0.3883356639812503}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5638133849412187, "res": {"Yes": 0.5638133849412187, "No": 0.43616761998848863}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3086515834224616, "res": {"No": 0.69132859692864, "Yes": 0.3086515834224616}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4058026058897605, "res": {"No": 0.5941707993251724, "Yes": 0.4058026058897605}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6027805975243843, "res": {"Yes": 0.6027805975243843, "No": 0.3971928293381035}, "ground_truth": 1}, {"key": "28071228", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3915858354285558, "res": {"No": 0.608394334968789, "Yes": 0.3915858354285558}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.66005233608964, "res": {"Yes": 0.66005233608964, "No": 0.3399246512168651}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6134178669472449, "res": {"Yes": 0.6134178669472449, "No": 0.38655914325864404}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7243486077966369, "res": {"Yes": 0.7243486077966369, "No": 0.27562583591153805}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6122240920566768, "res": {"Yes": 0.6122240920566768, "No": 0.38774853699311834}, "ground_truth": 1}, {"key": "36855834", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7702987903397138, "res": {"Yes": 0.7702987903397138, "No": 0.2296784480963744}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6453654845206666, "res": {"Yes": 0.6453654845206666, "No": 0.35460304437535217}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4742924331249272, "res": {"No": 0.525690259477336, "Yes": 0.4742924331249272}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4574147501955933, "res": {"No": 0.5425618233328087, "Yes": 0.4574147501955933}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5470508605427878, "res": {"Yes": 0.5470508605427878, "No": 0.45292807995485135}, "ground_truth": 1}, {"key": "40548717", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.521500054518296, "res": {"Yes": 0.521500054518296, "No": 0.47847409858170076}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.47169405128348985, "res": {"No": 0.5282813644467975, "Yes": 0.47169405128348985}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6541817375278016, "res": {"Yes": 0.6541817375278016, "No": 0.3458016618264462}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7457336202191003, "res": {"Yes": 0.7457336202191003, "No": 0.2542433753619001}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8389429939967562, "res": {"Yes": 0.8389429939967562, "No": 0.16104370358423947}, "ground_truth": 1}, {"key": "37051175", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8793264871986305, "res": {"Yes": 0.8793264871986305, "No": 0.12065797364929777}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6972662269216917, "res": {"Yes": 0.6972662269216917, "No": 0.3027162139405457}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6781987651960082, "res": {"Yes": 0.6781987651960082, "No": 0.32178099647673386}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8144777489296009, "res": {"Yes": 0.8144777489296009, "No": 0.1854918747093347}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.568523761404054, "res": {"Yes": 0.568523761404054, "No": 0.4314554147434807}, "ground_truth": 1}, {"key": "38882119", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7834415430411255, "res": {"Yes": 0.7834415430411255, "No": 0.21653380511727563}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6931865528411537, "res": {"Yes": 0.6931865528411537, "No": 0.3067781902064801}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5219517125874803, "res": {"Yes": 0.5219517125874803, "No": 0.4780324938669425}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.707215719574939, "res": {"Yes": 0.707215719574939, "No": 0.2927643967756255}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.635188673881037, "res": {"Yes": 0.635188673881037, "No": 0.3647894650133811}, "ground_truth": 1}, {"key": "19485402", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7465242780699425, "res": {"Yes": 0.7465242780699425, "No": 0.25344815338619187}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5188811085484175, "res": {"Yes": 0.5188811085484175, "No": 0.48109539602816376}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6041105306647826, "res": {"Yes": 0.6041105306647826, "No": 0.39586206464866264}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5747826383001815, "res": {"Yes": 0.5747826383001815, "No": 0.4251800001314746}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6308826994484423, "res": {"Yes": 0.6308826994484423, "No": 0.3690724177986729}, "ground_truth": 1}, {"key": "36060907", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.79669509441119, "res": {"Yes": 0.79669509441119, "No": 0.20325616477863473}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4532772091182724, "res": {"No": 0.5466826333013277, "Yes": 0.4532772091182724}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.22582595206806427, "res": {"No": 0.7741450034347139, "Yes": 0.22582595206806427}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5310431496131415, "res": {"Yes": 0.5310431496131415, "No": 0.4689246895885084}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.41281880958406725, "res": {"No": 0.5871424582071169, "Yes": 0.41281880958406725}, "ground_truth": 1}, {"key": "24037309", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4903229859621132, "res": {"No": 0.5096286987915186, "Yes": 0.4903229859621132}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.36594618203974355, "res": {"No": 0.6340119031732117, "Yes": 0.36594618203974355}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5201876328953468, "res": {"Yes": 0.5201876328953468, "No": 0.4797826932431668}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5827488351225334, "res": {"Yes": 0.5827488351225334, "No": 0.4172223441012462}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4128316071655258, "res": {"No": 0.587130421910096, "Yes": 0.4128316071655258}, "ground_truth": 1}, {"key": "35605805", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.48475369616467384, "res": {"No": 0.5152200438296068, "Yes": 0.48475369616467384}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3864378600298234, "res": {"No": 0.6135272061571452, "Yes": 0.3864378600298234}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3227869083323555, "res": {"No": 0.6771988004923841, "Yes": 0.3227869083323555}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.48901241562666525, "res": {"No": 0.5109687424618197, "Yes": 0.48901241562666525}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3935387424246476, "res": {"No": 0.6064378069766897, "Yes": 0.3935387424246476}, "ground_truth": 1}, {"key": "17706248", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5855283950639429, "res": {"Yes": 0.5855283950639429, "No": 0.41444541577094346}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6735436597942793, "res": {"Yes": 0.6735436597942793, "No": 0.3264370993914515}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5815835134805352, "res": {"Yes": 0.5815835134805352, "No": 0.41839902355236713}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8012730528928628, "res": {"Yes": 0.8012730528928628, "No": 0.19870382092335845}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8080039919023826, "res": {"Yes": 0.8080039919023826, "No": 0.19197525413005578}, "ground_truth": 1}, {"key": "36883559", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7717354801232903, "res": {"Yes": 0.7717354801232903, "No": 0.2282412033020019}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4934912257015977, "res": {"No": 0.5064839874042246, "Yes": 0.4934912257015977}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3530370394263329, "res": {"No": 0.6469473457120374, "Yes": 0.3530370394263329}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5930564029029531, "res": {"Yes": 0.5930564029029531, "No": 0.40691385679815933}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4816535496668968, "res": {"No": 0.5183201745911638, "Yes": 0.4816535496668968}, "ground_truth": 1}, {"key": "32799471", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7217481165518725, "res": {"Yes": 0.7217481165518725, "No": 0.2782257623716683}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.60283358426764, "res": {"Yes": 0.60283358426764, "No": 0.3971398473486471}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3838244854588183, "res": {"No": 0.61616038751272, "Yes": 0.3838244854588183}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.820303783210531, "res": {"Yes": 0.820303783210531, "No": 0.17967448175114198}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8722684124456626, "res": {"Yes": 0.8722684124456626, "No": 0.1277129003875647}, "ground_truth": 1}, {"key": "34797243", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.927565075219553, "res": {"Yes": 0.927565075219553, "No": 0.07241235101573544}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7812828350114935, "res": {"Yes": 0.7812828350114935, "No": 0.21869478435137552}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.38366154817632553, "res": {"No": 0.6163077475645883, "Yes": 0.38366154817632553}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.64394662290546, "res": {"Yes": 0.64394662290546, "No": 0.3560235495131875}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6743871003987753, "res": {"Yes": 0.6743871003987753, "No": 0.3255809350025639}, "ground_truth": 1}, {"key": "32154876", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7390632079200642, "res": {"Yes": 0.7390632079200642, "No": 0.2609088934079869}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8451408323577386, "res": {"Yes": 0.8451408323577386, "No": 0.1548293401396957}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4328387163190913, "res": {"No": 0.5671485027129805, "Yes": 0.4328387163190913}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7505161793848159, "res": {"Yes": 0.7505161793848159, "No": 0.24945792881320805}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6785962857826447, "res": {"Yes": 0.6785962857826447, "No": 0.3213603499390921}, "ground_truth": 1}, {"key": "37962274", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6943103348871843, "res": {"Yes": 0.6943103348871843, "No": 0.3056674905598097}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6776920349303227, "res": {"Yes": 0.6776920349303227, "No": 0.3222779844907546}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6190575302414603, "res": {"Yes": 0.6190575302414603, "No": 0.3809271993251068}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5997349928008456, "res": {"Yes": 0.5997349928008456, "No": 0.40024640861501415}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6251591010256579, "res": {"Yes": 0.6251591010256579, "No": 0.3748220870967523}, "ground_truth": 1}, {"key": "35574030", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5861460431868546, "res": {"Yes": 0.5861460431868546, "No": 0.41383698033925814}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6038734034215673, "res": {"Yes": 0.6038734034215673, "No": 0.3961084070559417}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.32233222844004467, "res": {"No": 0.6776471596496066, "Yes": 0.32233222844004467}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4027031455522133, "res": {"No": 0.5972547378693885, "Yes": 0.4027031455522133}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3380635443951637, "res": {"No": 0.6619114455792777, "Yes": 0.3380635443951637}, "ground_truth": 1}, {"key": "39105949", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6287952701006473, "res": {"Yes": 0.6287952701006473, "No": 0.3711700557874629}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6617047298247647, "res": {"Yes": 0.6617047298247647, "No": 0.338259136909144}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4030902285145062, "res": {"No": 0.596892290374506, "Yes": 0.4030902285145062}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3349030138396055, "res": {"No": 0.6650796041511249, "Yes": 0.3349030138396055}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5516794378090522, "res": {"Yes": 0.5516794378090522, "No": 0.44830350922577394}, "ground_truth": 1}, {"key": "41064322", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.43188611421300854, "res": {"No": 0.5680913759774247, "Yes": 0.43188611421300854}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5662756699315284, "res": {"Yes": 0.5662756699315284, "No": 0.4337018771187343}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.46179604796102314, "res": {"No": 0.5381793554149569, "Yes": 0.46179604796102314}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7528862914165134, "res": {"Yes": 0.7528862914165134, "No": 0.24708882292832302}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6109108737052794, "res": {"Yes": 0.6109108737052794, "No": 0.38906439858645037}, "ground_truth": 1}, {"key": "28105101", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6515570298657747, "res": {"Yes": 0.6515570298657747, "No": 0.3484129028858415}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6333051838728774, "res": {"Yes": 0.6333051838728774, "No": 0.36665339682351455}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5709327055209826, "res": {"Yes": 0.5709327055209826, "No": 0.4290491490784243}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.700389640159355, "res": {"Yes": 0.700389640159355, "No": 0.2995910802435693}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6927627295638055, "res": {"Yes": 0.6927627295638055, "No": 0.30720352597232303}, "ground_truth": 1}, {"key": "36036068", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7381695782135913, "res": {"Yes": 0.7381695782135913, "No": 0.2618055568965329}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7962496752063183, "res": {"Yes": 0.7962496752063183, "No": 0.20372844986269528}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.33130688106521233, "res": {"No": 0.6686777392955103, "Yes": 0.33130688106521233}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5907202818371303, "res": {"Yes": 0.5907202818371303, "No": 0.4092502302976827}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7422398055173384, "res": {"Yes": 0.7422398055173384, "No": 0.25773336434279726}, "ground_truth": 1}, {"key": "37991460", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.744654043200043, "res": {"Yes": 0.744654043200043, "No": 0.2553292219660329}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5925235262559775, "res": {"Yes": 0.5925235262559775, "No": 0.4074448308026122}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2990422533570912, "res": {"No": 0.7009425147123909, "Yes": 0.2990422533570912}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5514395259849939, "res": {"Yes": 0.5514395259849939, "No": 0.44853525235660896}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5671683248995409, "res": {"Yes": 0.5671683248995409, "No": 0.43280924100615575}, "ground_truth": 1}, {"key": "38437830", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.368303519318925, "res": {"No": 0.6316769124675604, "Yes": 0.368303519318925}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4901979156191903, "res": {"No": 0.509778658709762, "Yes": 0.4901979156191903}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5069580857058614, "res": {"Yes": 0.5069580857058614, "No": 0.493017553547642}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3616437021684846, "res": {"No": 0.6383283773552334, "Yes": 0.3616437021684846}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.49612594158606654, "res": {"No": 0.5038494076015956, "Yes": 0.49612594158606654}, "ground_truth": 1}, {"key": "36507138", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5734524028589414, "res": {"Yes": 0.5734524028589414, "No": 0.4265212027165079}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5422204965871102, "res": {"Yes": 0.5422204965871102, "No": 0.45775605855703955}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5014704482681707, "res": {"Yes": 0.5014704482681707, "No": 0.4985017594988568}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4309865309770479, "res": {"No": 0.5689912060909095, "Yes": 0.4309865309770479}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6479880980534549, "res": {"Yes": 0.6479880980534549, "No": 0.3519799377629273}, "ground_truth": 1}, {"key": "37824866", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6074844869367894, "res": {"Yes": 0.6074844869367894, "No": 0.39248262902507924}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4590041167534721, "res": {"No": 0.5409638462514782, "Yes": 0.4590041167534721}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3081314812264728, "res": {"No": 0.6918559705990693, "Yes": 0.3081314812264728}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8012447283910815, "res": {"Yes": 0.8012447283910815, "No": 0.1987354769633682}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5188613395547835, "res": {"Yes": 0.5188613395547835, "No": 0.48111468834035276}, "ground_truth": 1}, {"key": "25088134", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6147799684932616, "res": {"Yes": 0.6147799684932616, "No": 0.38520261900610914}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6891652475033238, "res": {"Yes": 0.6891652475033238, "No": 0.3108160254130063}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6406268684850674, "res": {"Yes": 0.6406268684850674, "No": 0.35935773870989923}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6394425485983058, "res": {"Yes": 0.6394425485983058, "No": 0.36053714143686105}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.656560450177531, "res": {"Yes": 0.656560450177531, "No": 0.34341371241391294}, "ground_truth": 1}, {"key": "40172531", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5785785264927248, "res": {"Yes": 0.5785785264927248, "No": 0.42140399388464345}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.45034093488457394, "res": {"No": 0.5496401157094354, "Yes": 0.45034093488457394}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5512270421399463, "res": {"Yes": 0.5512270421399463, "No": 0.4487585663511293}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8366047351476814, "res": {"Yes": 0.8366047351476814, "No": 0.16337513184984578}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7032238055591125, "res": {"Yes": 0.7032238055591125, "No": 0.2967539009504976}, "ground_truth": 1}, {"key": "37035874", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7184583091428065, "res": {"Yes": 0.7184583091428065, "No": 0.2815203338741366}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6916002041416781, "res": {"Yes": 0.6916002041416781, "No": 0.308382032304578}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3647645872202096, "res": {"No": 0.6352132116934537, "Yes": 0.3647645872202096}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6477847588995467, "res": {"Yes": 0.6477847588995467, "No": 0.3521850610212712}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6095913404555797, "res": {"Yes": 0.6095913404555797, "No": 0.39036991086220857}, "ground_truth": 1}, {"key": "36404465", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7367202044906808, "res": {"Yes": 0.7367202044906808, "No": 0.26324642718683494}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5859138229686118, "res": {"Yes": 0.5859138229686118, "No": 0.4140558793457221}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5374574418868412, "res": {"Yes": 0.5374574418868412, "No": 0.462526142177514}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.47532842158537203, "res": {"No": 0.5246534655231271, "Yes": 0.47532842158537203}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5343916403177708, "res": {"Yes": 0.5343916403177708, "No": 0.4655839894855035}, "ground_truth": 1}, {"key": "39602052", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5827465624065082, "res": {"Yes": 0.5827465624065082, "No": 0.41723188191304916}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.42627819753398355, "res": {"No": 0.5736976864873073, "Yes": 0.42627819753398355}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5191461168933151, "res": {"Yes": 0.5191461168933151, "No": 0.48083824712313383}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.538310310382155, "res": {"Yes": 0.538310310382155, "No": 0.46167061348517036}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5950120033157955, "res": {"Yes": 0.5950120033157955, "No": 0.4049627060268095}, "ground_truth": 1}, {"key": "33792789", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6331104218184136, "res": {"Yes": 0.6331104218184136, "No": 0.36687147376111434}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5932453629781335, "res": {"Yes": 0.5932453629781335, "No": 0.40673153107446963}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.36270933336793865, "res": {"No": 0.6372719955259312, "Yes": 0.36270933336793865}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5762531259753031, "res": {"Yes": 0.5762531259753031, "No": 0.423729711457527}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4911656379056523, "res": {"No": 0.5088198776556043, "Yes": 0.4911656379056523}, "ground_truth": 1}, {"key": "32776626", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.748591101827824, "res": {"Yes": 0.748591101827824, "No": 0.25139021641282994}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.45770242184473425, "res": {"No": 0.5422789944896022, "Yes": 0.45770242184473425}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4195765460477291, "res": {"No": 0.5804049438520651, "Yes": 0.4195765460477291}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7503190371760783, "res": {"Yes": 0.7503190371760783, "No": 0.24964656534779425}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7930738217022801, "res": {"Yes": 0.7930738217022801, "No": 0.20690461272773777}, "ground_truth": 1}, {"key": "37195090", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8005254695497412, "res": {"Yes": 0.8005254695497412, "No": 0.19944982062087804}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7677708981793098, "res": {"Yes": 0.7677708981793098, "No": 0.23220487850784777}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4408681622695532, "res": {"No": 0.5590886453251881, "Yes": 0.4408681622695532}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6495322113687486, "res": {"Yes": 0.6495322113687486, "No": 0.3504404805180413}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6038792972547464, "res": {"Yes": 0.6038792972547464, "No": 0.3960941474099628}, "ground_truth": 1}, {"key": "33981824", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6041900972610165, "res": {"Yes": 0.6041900972610165, "No": 0.3957730254922745}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6985435041338676, "res": {"Yes": 0.6985435041338676, "No": 0.30142649205104133}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3533002206772683, "res": {"No": 0.6466619819670267, "Yes": 0.3533002206772683}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5370451552605489, "res": {"Yes": 0.5370451552605489, "No": 0.4629000606144038}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3629485101845124, "res": {"No": 0.6370078691707587, "Yes": 0.3629485101845124}, "ground_truth": 1}, {"key": "39569142", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3042669006789744, "res": {"No": 0.6956945360302099, "Yes": 0.3042669006789744}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.23306970664702484, "res": {"No": 0.7668724183326652, "Yes": 0.23306970664702484}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.45000190630203496, "res": {"No": 0.5499779458577714, "Yes": 0.45000190630203496}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6855263099810159, "res": {"Yes": 0.6855263099810159, "No": 0.3144494333592914}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6604782137798605, "res": {"Yes": 0.6604782137798605, "No": 0.33950941513890925}, "ground_truth": 1}, {"key": "40268210", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6101938655069122, "res": {"Yes": 0.6101938655069122, "No": 0.38978436617952555}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6266261112568013, "res": {"Yes": 0.6266261112568013, "No": 0.3733507323269024}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.44845018674274706, "res": {"No": 0.5515305761667197, "Yes": 0.44845018674274706}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.47118946721673294, "res": {"No": 0.5287943368174616, "Yes": 0.47118946721673294}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5443036541931675, "res": {"Yes": 0.5443036541931675, "No": 0.4556796674442106}, "ground_truth": 1}, {"key": "34925159", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5649224013564611, "res": {"Yes": 0.5649224013564611, "No": 0.4350594458951377}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3421232249305401, "res": {"No": 0.6578580502717314, "Yes": 0.3421232249305401}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6493586340916488, "res": {"Yes": 0.6493586340916488, "No": 0.35062759558310963}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5953391117939938, "res": {"Yes": 0.5953391117939938, "No": 0.40463388838806824}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.55554692501266, "res": {"Yes": 0.55554692501266, "No": 0.4444294874589382}, "ground_truth": 1}, {"key": "36181903", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3890898247756897, "res": {"No": 0.6108925588718265, "Yes": 0.3890898247756897}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.38183030378678384, "res": {"No": 0.6181473002538211, "Yes": 0.38183030378678384}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6069087674258924, "res": {"Yes": 0.6069087674258924, "No": 0.39307290712718196}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.36088118581104317, "res": {"No": 0.6391025003723745, "Yes": 0.36088118581104317}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5543358547005747, "res": {"Yes": 0.5543358547005747, "No": 0.445638920568098}, "ground_truth": 1}, {"key": "38620559", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5698086706660341, "res": {"Yes": 0.5698086706660341, "No": 0.4301682963525476}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4283266558061806, "res": {"No": 0.5716533744565702, "Yes": 0.4283266558061806}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.44071839393889256, "res": {"No": 0.5592623476000125, "Yes": 0.44071839393889256}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5798752411759944, "res": {"Yes": 0.5798752411759944, "No": 0.42009487515019656}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.37963079145748513, "res": {"No": 0.6203407842067064, "Yes": 0.37963079145748513}, "ground_truth": 1}, {"key": "32719657", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5200751544818999, "res": {"Yes": 0.5200751544818999, "No": 0.479889408780472}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.12839639043479062, "res": {"No": 0.8715704932760779, "Yes": 0.12839639043479062}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.20491971719238503, "res": {"No": 0.7950716520693539, "Yes": 0.20491971719238503}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5661469870834525, "res": {"Yes": 0.5661469870834525, "No": 0.4338357815552873}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6371544233169943, "res": {"Yes": 0.6371544233169943, "No": 0.36282574547033924}, "ground_truth": 1}, {"key": "37530914", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7129261787807141, "res": {"Yes": 0.7129261787807141, "No": 0.2870555006105776}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6196139538213893, "res": {"Yes": 0.6196139538213893, "No": 0.38036525140466265}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.48842793568945253, "res": {"No": 0.5115586691359408, "Yes": 0.48842793568945253}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.46782832840813926, "res": {"No": 0.5321521682469761, "Yes": 0.46782832840813926}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6443971567068252, "res": {"Yes": 0.6443971567068252, "No": 0.35558359845001386}, "ground_truth": 1}, {"key": "33306933", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.670684423761205, "res": {"Yes": 0.670684423761205, "No": 0.3292940692286282}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5913447785710932, "res": {"Yes": 0.5913447785710932, "No": 0.4086340078033515}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7785726823684203, "res": {"Yes": 0.7785726823684203, "No": 0.2213947658797337}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3644530654579364, "res": {"No": 0.6355222545527519, "Yes": 0.3644530654579364}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4600829866542738, "res": {"No": 0.5398793447702068, "Yes": 0.4600829866542738}, "ground_truth": 1}, {"key": "33837212", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.659869381741503, "res": {"Yes": 0.659869381741503, "No": 0.3400923774135755}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.33490612845211715, "res": {"No": 0.6650743766459805, "Yes": 0.33490612845211715}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.44138510086486415, "res": {"No": 0.5585838429918025, "Yes": 0.44138510086486415}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6615059769620465, "res": {"Yes": 0.6615059769620465, "No": 0.33846726410721456}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.47188320549573626, "res": {"No": 0.5280961814648961, "Yes": 0.47188320549573626}, "ground_truth": 1}, {"key": "40945179", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6245601731093826, "res": {"Yes": 0.6245601731093826, "No": 0.3754141208726556}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5258550892093926, "res": {"Yes": 0.5258550892093926, "No": 0.4741236292938401}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.42689606622778287, "res": {"No": 0.573087848932767, "Yes": 0.42689606622778287}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7175199405695353, "res": {"Yes": 0.7175199405695353, "No": 0.28246255100416023}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6513383975006375, "res": {"Yes": 0.6513383975006375, "No": 0.3486409789078251}, "ground_truth": 1}, {"key": "34152358", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7942626889063299, "res": {"Yes": 0.7942626889063299, "No": 0.2057175227501912}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.726270677224479, "res": {"Yes": 0.726270677224479, "No": 0.27370913158777477}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5231388670444402, "res": {"Yes": 0.5231388670444402, "No": 0.47685331552917465}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5327701106283826, "res": {"Yes": 0.5327701106283826, "No": 0.46721525314609247}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6021803282144695, "res": {"Yes": 0.6021803282144695, "No": 0.39780438082139113}, "ground_truth": 1}, {"key": "34136541", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6779230656315993, "res": {"Yes": 0.6779230656315993, "No": 0.3220590387786744}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4600153318250379, "res": {"No": 0.539966785310399, "Yes": 0.4600153318250379}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4594285014753362, "res": {"No": 0.5405538915650046, "Yes": 0.4594285014753362}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4035282222902458, "res": {"No": 0.5964454450803494, "Yes": 0.4035282222902458}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7451645816755238, "res": {"Yes": 0.7451645816755238, "No": 0.25482536794913174}, "ground_truth": 1}, {"key": "37469603", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5808211504909768, "res": {"Yes": 0.5808211504909768, "No": 0.4191588977680003}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4809855744858566, "res": {"No": 0.518993271632247, "Yes": 0.4809855744858566}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6036277373178733, "res": {"Yes": 0.6036277373178733, "No": 0.3963492547433883}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.701236495559377, "res": {"Yes": 0.701236495559377, "No": 0.29873090323663426}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7524478703809568, "res": {"Yes": 0.7524478703809568, "No": 0.24753017133977465}, "ground_truth": 1}, {"key": "37353611", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7049736448923877, "res": {"Yes": 0.7049736448923877, "No": 0.29499994767948823}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7191452679598381, "res": {"Yes": 0.7191452679598381, "No": 0.2808317621942258}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6880177100695067, "res": {"Yes": 0.6880177100695067, "No": 0.3119594710784576}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6962911132032318, "res": {"Yes": 0.6962911132032318, "No": 0.30367807575617156}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6847952777413553, "res": {"Yes": 0.6847952777413553, "No": 0.3151805278601907}, "ground_truth": 1}, {"key": "37211649", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7099635132897641, "res": {"Yes": 0.7099635132897641, "No": 0.29001225449938023}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6337921737118264, "res": {"Yes": 0.6337921737118264, "No": 0.3661816343373731}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4868386767588875, "res": {"No": 0.513145011636862, "Yes": 0.4868386767588875}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8636488900747351, "res": {"Yes": 0.8636488900747351, "No": 0.13633825663804203}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7613937299225066, "res": {"Yes": 0.7613937299225066, "No": 0.238584484183859}, "ground_truth": 1}, {"key": "37320976", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7373400910302148, "res": {"Yes": 0.7373400910302148, "No": 0.2626415511009506}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.717395174700577, "res": {"Yes": 0.717395174700577, "No": 0.28259124200329266}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4397848451319906, "res": {"No": 0.5601903736933721, "Yes": 0.4397848451319906}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6114895335668502, "res": {"Yes": 0.6114895335668502, "No": 0.3884729649049762}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.41117523204865214, "res": {"No": 0.5887937655639333, "Yes": 0.41117523204865214}, "ground_truth": 1}, {"key": "34492412", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5671794471794458, "res": {"Yes": 0.5671794471794458, "No": 0.4327607690856413}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.31252191008232205, "res": {"No": 0.6874475453671541, "Yes": 0.31252191008232205}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4684090810799448, "res": {"No": 0.5315642256630253, "Yes": 0.4684090810799448}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5083679411374524, "res": {"Yes": 0.5083679411374524, "No": 0.49161094868821076}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4869512809601464, "res": {"No": 0.5130219434345303, "Yes": 0.4869512809601464}, "ground_truth": 1}, {"key": "36655016", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4617329432251536, "res": {"No": 0.5382413034238046, "Yes": 0.4617329432251536}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.34383864048956386, "res": {"No": 0.656142688981113, "Yes": 0.34383864048956386}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3465522423999724, "res": {"No": 0.6534282339032168, "Yes": 0.3465522423999724}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5388999536776056, "res": {"Yes": 0.5388999536776056, "No": 0.4610783471461214}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.756888430619885, "res": {"Yes": 0.756888430619885, "No": 0.24307979866056137}, "ground_truth": 1}, {"key": "35220773", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7650738376572042, "res": {"Yes": 0.7650738376572042, "No": 0.2349007956821743}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5224840614554096, "res": {"Yes": 0.5224840614554096, "No": 0.4774934673964818}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6969787057357548, "res": {"Yes": 0.6969787057357548, "No": 0.3030037491854438}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6752342576139378, "res": {"Yes": 0.6752342576139378, "No": 0.3247480591151562}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5065639016867899, "res": {"Yes": 0.5065639016867899, "No": 0.4934213029490599}, "ground_truth": 1}, {"key": "31569808", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6451877172710101, "res": {"Yes": 0.6451877172710101, "No": 0.354796249268199}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.506711941286395, "res": {"Yes": 0.506711941286395, "No": 0.49326999383988335}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6258001550403142, "res": {"Yes": 0.6258001550403142, "No": 0.37418516893010734}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7286692890798808, "res": {"Yes": 0.7286692890798808, "No": 0.271312848887025}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6638919291873954, "res": {"Yes": 0.6638919291873954, "No": 0.336086806401751}, "ground_truth": 1}, {"key": "37696256", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.503530798437554, "res": {"Yes": 0.503530798437554, "No": 0.4964566552063411}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7155865521042845, "res": {"Yes": 0.7155865521042845, "No": 0.28439214527995776}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.25137053332948756, "res": {"No": 0.7486196012335532, "Yes": 0.25137053332948756}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7031794897912906, "res": {"Yes": 0.7031794897912906, "No": 0.2967969333859116}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6214987371327803, "res": {"Yes": 0.6214987371327803, "No": 0.3784810512899309}, "ground_truth": 1}, {"key": "36874328", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6169521566373832, "res": {"Yes": 0.6169521566373832, "No": 0.3830253515329683}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4266816688446847, "res": {"No": 0.5732951493680902, "Yes": 0.4266816688446847}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7255026166350211, "res": {"Yes": 0.7255026166350211, "No": 0.2744526303376278}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6936483619165241, "res": {"Yes": 0.6936483619165241, "No": 0.3063088108901484}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6397009355785952, "res": {"Yes": 0.6397009355785952, "No": 0.3602661554501633}, "ground_truth": 1}, {"key": "24532377", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.60094361949733, "res": {"Yes": 0.60094361949733, "No": 0.3990226487176054}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7839309786056893, "res": {"Yes": 0.7839309786056893, "No": 0.21601545995359983}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.1799599235186657, "res": {"No": 0.8200147918869604, "Yes": 0.1799599235186657}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.48763505061818824, "res": {"No": 0.5123293187622647, "Yes": 0.48763505061818824}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5936825678616847, "res": {"Yes": 0.5936825678616847, "No": 0.4062920674715473}, "ground_truth": 1}, {"key": "39560618", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5977238386352844, "res": {"Yes": 0.5977238386352844, "No": 0.4022506971439586}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4351437250719824, "res": {"No": 0.5648292533327431, "Yes": 0.4351437250719824}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6315827933033561, "res": {"Yes": 0.6315827933033561, "No": 0.3684045956716675}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7525578260969459, "res": {"Yes": 0.7525578260969459, "No": 0.247429917175217}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5907763084053977, "res": {"Yes": 0.5907763084053977, "No": 0.40920943008364646}, "ground_truth": 1}, {"key": "34922693", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7302194891232694, "res": {"Yes": 0.7302194891232694, "No": 0.2697633731456232}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7831488334656334, "res": {"Yes": 0.7831488334656334, "No": 0.216835950461909}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.11533096816992269, "res": {"No": 0.8846482063059362, "Yes": 0.11533096816992269}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.40496509531382346, "res": {"No": 0.5950109917962497, "Yes": 0.40496509531382346}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4616946810015657, "res": {"No": 0.5382706383742113, "Yes": 0.4616946810015657}, "ground_truth": 1}, {"key": "33629577", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5295865135684268, "res": {"Yes": 0.5295865135684268, "No": 0.4703695107880169}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4200338818025489, "res": {"No": 0.579924880621177, "Yes": 0.4200338818025489}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5086591159759484, "res": {"Yes": 0.5086591159759484, "No": 0.4913271204139556}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7004139581098185, "res": {"Yes": 0.7004139581098185, "No": 0.29956774300741545}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8244514936039604, "res": {"Yes": 0.8244514936039604, "No": 0.17553316141397107}, "ground_truth": 1}, {"key": "32284359", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7749219998877482, "res": {"Yes": 0.7749219998877482, "No": 0.22505836734422588}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7059229382972068, "res": {"Yes": 0.7059229382972068, "No": 0.2940564568431881}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.43914267004121227, "res": {"No": 0.5608359726948838, "Yes": 0.43914267004121227}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3795777075993176, "res": {"No": 0.620397200562835, "Yes": 0.3795777075993176}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4501278794647306, "res": {"No": 0.5498444824067567, "Yes": 0.4501278794647306}, "ground_truth": 1}, {"key": "28082962", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.690994620734135, "res": {"Yes": 0.690994620734135, "No": 0.30898183197820317}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6960350226599503, "res": {"Yes": 0.6960350226599503, "No": 0.30394357602001826}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.48598180211039005, "res": {"No": 0.513990755036006, "Yes": 0.48598180211039005}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6089551252181973, "res": {"Yes": 0.6089551252181973, "No": 0.3910052312227318}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5701607160008332, "res": {"Yes": 0.5701607160008332, "No": 0.42980482443482443}, "ground_truth": 1}, {"key": "24796803", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.534108808255639, "res": {"Yes": 0.534108808255639, "No": 0.46585176328551187}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5195639899467533, "res": {"Yes": 0.5195639899467533, "No": 0.4803990049851691}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.22638524659338932, "res": {"No": 0.7736001584666016, "Yes": 0.22638524659338932}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4550173631454769, "res": {"No": 0.5449627147292598, "Yes": 0.4550173631454769}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3471022062143185, "res": {"No": 0.6528793300286959, "Yes": 0.3471022062143185}, "ground_truth": 1}, {"key": "35466150", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.47223709481192805, "res": {"No": 0.5277397576612846, "Yes": 0.47223709481192805}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3590646942157614, "res": {"No": 0.6409071720136056, "Yes": 0.3590646942157614}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.789694829439279, "res": {"Yes": 0.789694829439279, "No": 0.21028536284571964}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5128750144732234, "res": {"Yes": 0.5128750144732234, "No": 0.4871090300261315}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5567731127559993, "res": {"Yes": 0.5567731127559993, "No": 0.44320957479636913}, "ground_truth": 1}, {"key": "35754289", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5627659255974923, "res": {"Yes": 0.5627659255974923, "No": 0.4372154870698834}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.604478425131564, "res": {"Yes": 0.604478425131564, "No": 0.39550371446422916}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5073091184998852, "res": {"Yes": 0.5073091184998852, "No": 0.49267530621509303}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.49790696334649087, "res": {"No": 0.50208110931559, "Yes": 0.49790696334649087}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.42745813295902496, "res": {"No": 0.572525015106013, "Yes": 0.42745813295902496}, "ground_truth": 1}, {"key": "36678662", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5117448080363854, "res": {"Yes": 0.5117448080363854, "No": 0.4882376519354233}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.44959419138655654, "res": {"No": 0.5503911509397331, "Yes": 0.44959419138655654}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.582889038045242, "res": {"Yes": 0.582889038045242, "No": 0.41708322364911327}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.570008617412658, "res": {"Yes": 0.570008617412658, "No": 0.4299697377915826}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6687658701420266, "res": {"Yes": 0.6687658701420266, "No": 0.331217870865326}, "ground_truth": 1}, {"key": "35399671", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4983906359040015, "res": {"No": 0.5015863264015489, "Yes": 0.4983906359040015}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6181895829752111, "res": {"Yes": 0.6181895829752111, "No": 0.3817835897069077}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.16447149606358122, "res": {"No": 0.8355101688878407, "Yes": 0.16447149606358122}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.33848445868096966, "res": {"No": 0.6614878387168346, "Yes": 0.33848445868096966}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.2932972438724777, "res": {"No": 0.7066754576435063, "Yes": 0.2932972438724777}, "ground_truth": 1}, {"key": "36888180", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.35714668472806693, "res": {"No": 0.6428303055967264, "Yes": 0.35714668472806693}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.33375639780440786, "res": {"No": 0.6662157579632305, "Yes": 0.33375639780440786}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5413064010073501, "res": {"Yes": 0.5413064010073501, "No": 0.45867231250140567}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6306568397194606, "res": {"Yes": 0.6306568397194606, "No": 0.369319764402615}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6872654302667724, "res": {"Yes": 0.6872654302667724, "No": 0.3127109492315753}, "ground_truth": 1}, {"key": "28061069", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.790776314064558, "res": {"Yes": 0.790776314064558, "No": 0.2091962233028453}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5513399449990347, "res": {"Yes": 0.5513399449990347, "No": 0.4486347933727742}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5966406160619204, "res": {"Yes": 0.5966406160619204, "No": 0.403335482726376}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5857284457304052, "res": {"Yes": 0.5857284457304052, "No": 0.4142518569524733}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6712568220551876, "res": {"Yes": 0.6712568220551876, "No": 0.3287200507566673}, "ground_truth": 1}, {"key": "22259982", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7682179477202856, "res": {"Yes": 0.7682179477202856, "No": 0.23176512786748488}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.666740076113523, "res": {"Yes": 0.666740076113523, "No": 0.3332262134383995}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5135309904616664, "res": {"Yes": 0.5135309904616664, "No": 0.48644346096935304}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4790185958935738, "res": {"No": 0.5209584973493193, "Yes": 0.4790185958935738}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5165042820209421, "res": {"Yes": 0.5165042820209421, "No": 0.4834685561594295}, "ground_truth": 1}, {"key": "34026805", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.29325905905721095, "res": {"No": 0.7067183117425809, "Yes": 0.29325905905721095}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.28618082863640504, "res": {"No": 0.7138010977724779, "Yes": 0.28618082863640504}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7320388739074349, "res": {"Yes": 0.7320388739074349, "No": 0.26791315486438394}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6570257026696222, "res": {"Yes": 0.6570257026696222, "No": 0.34292695969086273}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6605299246434126, "res": {"Yes": 0.6605299246434126, "No": 0.3394161647111032}, "ground_truth": 1}, {"key": "36713809", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6904515328357604, "res": {"Yes": 0.6904515328357604, "No": 0.30951017864976293}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7226270909759092, "res": {"Yes": 0.7226270909759092, "No": 0.27734207691174784}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.14158745447329785, "res": {"No": 0.8583950965461976, "Yes": 0.14158745447329785}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7368627220629781, "res": {"Yes": 0.7368627220629781, "No": 0.2631066015080513}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5341661051805662, "res": {"Yes": 0.5341661051805662, "No": 0.4658146596702373}, "ground_truth": 1}, {"key": "39726411", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7072294821267512, "res": {"Yes": 0.7072294821267512, "No": 0.2927449871395558}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6559584896583598, "res": {"Yes": 0.6559584896583598, "No": 0.34401424932851915}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.44680004994647526, "res": {"No": 0.5531806600188293, "Yes": 0.44680004994647526}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6747043864742656, "res": {"Yes": 0.6747043864742656, "No": 0.3252709342806668}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4777304106745777, "res": {"No": 0.5222420767679711, "Yes": 0.4777304106745777}, "ground_truth": 1}, {"key": "37069841", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7113063642021804, "res": {"Yes": 0.7113063642021804, "No": 0.28867493970856334}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.0684751002360377, "res": {"No": 0.9315166357516181, "Yes": 0.0684751002360377}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6402707149211796, "res": {"Yes": 0.6402707149211796, "No": 0.3596974922812586}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7587440564374247, "res": {"Yes": 0.7587440564374247, "No": 0.2412294557263841}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7065773637653299, "res": {"Yes": 0.7065773637653299, "No": 0.29339190616601496}, "ground_truth": 1}, {"key": "38894693", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6730515667895578, "res": {"Yes": 0.6730515667895578, "No": 0.32692731862229757}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5349956301839259, "res": {"Yes": 0.5349956301839259, "No": 0.4649727580265882}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5627646312373519, "res": {"Yes": 0.5627646312373519, "No": 0.43721616475441355}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5817598763370804, "res": {"Yes": 0.5817598763370804, "No": 0.41820990810658687}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.544167976205141, "res": {"Yes": 0.544167976205141, "No": 0.45580073482793043}, "ground_truth": 1}, {"key": "33946032", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5075778199594333, "res": {"Yes": 0.5075778199594333, "No": 0.49238842118855364}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.45702092563525387, "res": {"No": 0.5429525216389802, "Yes": 0.45702092563525387}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.27779420755866435, "res": {"No": 0.7221626849902657, "Yes": 0.27779420755866435}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5526898968153344, "res": {"Yes": 0.5526898968153344, "No": 0.4472601780021651}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6590181520620695, "res": {"Yes": 0.6590181520620695, "No": 0.3409348757987334}, "ground_truth": 1}, {"key": "39035311", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5966192746087781, "res": {"Yes": 0.5966192746087781, "No": 0.40333415172147913}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4554140380818908, "res": {"No": 0.5445438212769371, "Yes": 0.4554140380818908}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.40680669387085844, "res": {"No": 0.5931739405361481, "Yes": 0.40680669387085844}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5078920774185425, "res": {"Yes": 0.5078920774185425, "No": 0.4920856461986749}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.630423237248675, "res": {"Yes": 0.630423237248675, "No": 0.3695528195853276}, "ground_truth": 1}, {"key": "27680038", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5744194502302243, "res": {"Yes": 0.5744194502302243, "No": 0.42555858728526985}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.624767623988184, "res": {"Yes": 0.624767623988184, "No": 0.37521231871236727}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2010948684366034, "res": {"No": 0.7988835568052908, "Yes": 0.2010948684366034}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3721308832110965, "res": {"No": 0.6278454446804625, "Yes": 0.3721308832110965}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.34828972586236223, "res": {"No": 0.6516844999193965, "Yes": 0.34828972586236223}, "ground_truth": 1}, {"key": "36901907", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3954767815783493, "res": {"No": 0.6045064131305647, "Yes": 0.3954767815783493}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.43472366614141694, "res": {"No": 0.5652556343406296, "Yes": 0.43472366614141694}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5190596343544363, "res": {"Yes": 0.5190596343544363, "No": 0.48092507030637893}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7433467158295514, "res": {"Yes": 0.7433467158295514, "No": 0.25662831141875964}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7024832159119063, "res": {"Yes": 0.7024832159119063, "No": 0.2974926679042984}, "ground_truth": 1}, {"key": "21530542", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.782891399944183, "res": {"Yes": 0.782891399944183, "No": 0.21708701826359628}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6319231628471204, "res": {"Yes": 0.6319231628471204, "No": 0.36805305868392474}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.8511059138882339, "res": {"Yes": 0.8511059138882339, "No": 0.14886796601695548}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.31244175849226685, "res": {"No": 0.6875295627515562, "Yes": 0.31244175849226685}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.39265594836322243, "res": {"No": 0.6072892606494955, "Yes": 0.39265594836322243}, "ground_truth": 1}, {"key": "38192532", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5008600591345308, "res": {"Yes": 0.5008600591345308, "No": 0.499092983954345}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.43398647888929875, "res": {"No": 0.565970020214898, "Yes": 0.43398647888929875}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6986446046652438, "res": {"Yes": 0.6986446046652438, "No": 0.3013177871214711}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7957247932832041, "res": {"Yes": 0.7957247932832041, "No": 0.20423977657155135}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6765681887990441, "res": {"Yes": 0.6765681887990441, "No": 0.32340350303574694}, "ground_truth": 1}, {"key": "34102400", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6901316655202568, "res": {"Yes": 0.6901316655202568, "No": 0.3098386192865208}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6879395075411281, "res": {"Yes": 0.6879395075411281, "No": 0.31202873376891116}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6869640892225687, "res": {"Yes": 0.6869640892225687, "No": 0.31301774398527565}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7413209029676203, "res": {"Yes": 0.7413209029676203, "No": 0.258651547386689}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7280989279328588, "res": {"Yes": 0.7280989279328588, "No": 0.2718823888851208}, "ground_truth": 1}, {"key": "36133399", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7237547044589967, "res": {"Yes": 0.7237547044589967, "No": 0.27622578116068064}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5914878954097832, "res": {"Yes": 0.5914878954097832, "No": 0.40849675843549094}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5279982339886157, "res": {"Yes": 0.5279982339886157, "No": 0.47198019689862486}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6113778674304385, "res": {"Yes": 0.6113778674304385, "No": 0.3885909620613791}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6041560460667065, "res": {"Yes": 0.6041560460667065, "No": 0.3958126047737548}, "ground_truth": 1}, {"key": "34314544", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6275858968086209, "res": {"Yes": 0.6275858968086209, "No": 0.3723859360504776}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6105158826274519, "res": {"Yes": 0.6105158826274519, "No": 0.3894533615974291}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.29047734266511177, "res": {"No": 0.7095101476126245, "Yes": 0.29047734266511177}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7674961007421074, "res": {"Yes": 0.7674961007421074, "No": 0.23247843754440548}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5719227781216109, "res": {"Yes": 0.5719227781216109, "No": 0.4280498149941086}, "ground_truth": 1}, {"key": "33460074", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6995804155581743, "res": {"Yes": 0.6995804155581743, "No": 0.30040239092079885}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6614494404623172, "res": {"Yes": 0.6614494404623172, "No": 0.33852548548353584}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3997298240345847, "res": {"No": 0.6002372411500372, "Yes": 0.3997298240345847}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7326829413425258, "res": {"Yes": 0.7326829413425258, "No": 0.2672838437635806}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4811591935073565, "res": {"No": 0.5188054404453989, "Yes": 0.4811591935073565}, "ground_truth": 1}, {"key": "36191495", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5648071124599764, "res": {"Yes": 0.5648071124599764, "No": 0.435162349621978}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7829627950661551, "res": {"Yes": 0.7829627950661551, "No": 0.21700039612120559}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5881033389567715, "res": {"Yes": 0.5881033389567715, "No": 0.41188234121230854}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7378763321764322, "res": {"Yes": 0.7378763321764322, "No": 0.26209868128721014}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7680328295025263, "res": {"Yes": 0.7680328295025263, "No": 0.23194451393346702}, "ground_truth": 1}, {"key": "39532668", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8124624591246226, "res": {"Yes": 0.8124624591246226, "No": 0.18751705081992265}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7230753816127536, "res": {"Yes": 0.7230753816127536, "No": 0.27690186875047157}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.10423055067261199, "res": {"No": 0.8957502354005098, "Yes": 0.10423055067261199}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5177442212725103, "res": {"Yes": 0.5177442212725103, "No": 0.4822336651170707}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6579051545944454, "res": {"Yes": 0.6579051545944454, "No": 0.3420687974552741}, "ground_truth": 1}, {"key": "20328247", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5400682275986881, "res": {"Yes": 0.5400682275986881, "No": 0.45991488004595193}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5690178070515868, "res": {"Yes": 0.5690178070515868, "No": 0.4309647408489008}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5701941854171801, "res": {"Yes": 0.5701941854171801, "No": 0.4297776057571815}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6351641433681389, "res": {"Yes": 0.6351641433681389, "No": 0.3648087628865046}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8382512688061688, "res": {"Yes": 0.8382512688061688, "No": 0.16172723457818652}, "ground_truth": 1}, {"key": "39112675", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8030369589539185, "res": {"Yes": 0.8030369589539185, "No": 0.19692935866660297}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.44563150074184077, "res": {"No": 0.5543499017491081, "Yes": 0.44563150074184077}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.27501891551229, "res": {"No": 0.7249695536317255, "Yes": 0.27501891551229}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.46474469833911597, "res": {"No": 0.5352240364617137, "Yes": 0.46474469833911597}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6158492311700413, "res": {"Yes": 0.6158492311700413, "No": 0.38413366539364685}, "ground_truth": 1}, {"key": "31620300", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6668965116845543, "res": {"Yes": 0.6668965116845543, "No": 0.33306990037296696}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5875436722393694, "res": {"Yes": 0.5875436722393694, "No": 0.4124309422292749}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3242978160637665, "res": {"No": 0.6756832620534158, "Yes": 0.3242978160637665}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7014672262925034, "res": {"Yes": 0.7014672262925034, "No": 0.2985192974993677}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7903141929443288, "res": {"Yes": 0.7903141929443288, "No": 0.20966778019876633}, "ground_truth": 1}, {"key": "37518509", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6844621921757934, "res": {"Yes": 0.6844621921757934, "No": 0.3155112941559215}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5000825470932454, "res": {"Yes": 0.5000825470932454, "No": 0.49989278177736357}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2714633878724303, "res": {"No": 0.7285162117435824, "Yes": 0.2714633878724303}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7781879990280735, "res": {"Yes": 0.7781879990280735, "No": 0.22178567308454528}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6367599239041293, "res": {"Yes": 0.6367599239041293, "No": 0.36321646504821165}, "ground_truth": 1}, {"key": "35454095", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.669050544092515, "res": {"Yes": 0.669050544092515, "No": 0.33091673206867445}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6755785122408824, "res": {"Yes": 0.6755785122408824, "No": 0.32439473072953634}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7982397404677999, "res": {"Yes": 0.7982397404677999, "No": 0.20174115786089072}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6681743075754972, "res": {"Yes": 0.6681743075754972, "No": 0.33180149351007937}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7131395396015778, "res": {"Yes": 0.7131395396015778, "No": 0.2868359871272233}, "ground_truth": 1}, {"key": "38542788", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6626368542513789, "res": {"Yes": 0.6626368542513789, "No": 0.33733974873315986}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6964215894924022, "res": {"Yes": 0.6964215894924022, "No": 0.3035589055001299}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3597310895960078, "res": {"No": 0.6402487348048272, "Yes": 0.3597310895960078}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6927118757184414, "res": {"Yes": 0.6927118757184414, "No": 0.3072588890357655}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7582368008123792, "res": {"Yes": 0.7582368008123792, "No": 0.2417418156073748}, "ground_truth": 1}, {"key": "23944937", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6738757919453091, "res": {"Yes": 0.6738757919453091, "No": 0.3260982052114753}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5966836831358597, "res": {"Yes": 0.5966836831358597, "No": 0.40328998904981606}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.621662896625564, "res": {"Yes": 0.621662896625564, "No": 0.3783175563052826}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6942501477331029, "res": {"Yes": 0.6942501477331029, "No": 0.30572373855272933}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6738468630785235, "res": {"Yes": 0.6738468630785235, "No": 0.3261352194582856}, "ground_truth": 1}, {"key": "31753944", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7813593107180444, "res": {"Yes": 0.7813593107180444, "No": 0.21862275815277635}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6944883927710818, "res": {"Yes": 0.6944883927710818, "No": 0.3054934624831343}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5935954038495481, "res": {"Yes": 0.5935954038495481, "No": 0.40638975182575643}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.519843850501031, "res": {"Yes": 0.519843850501031, "No": 0.48013551116330866}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6562162926345197, "res": {"Yes": 0.6562162926345197, "No": 0.3437623855360902}, "ground_truth": 1}, {"key": "35527214", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6451135378519348, "res": {"Yes": 0.6451135378519348, "No": 0.35486643490743514}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.49820534379861037, "res": {"No": 0.5017767747494912, "Yes": 0.49820534379861037}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4455689830280069, "res": {"No": 0.5544159287542366, "Yes": 0.4455689830280069}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.27914983452712205, "res": {"No": 0.7208338010420214, "Yes": 0.27914983452712205}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5409812276990896, "res": {"Yes": 0.5409812276990896, "No": 0.45900046768524894}, "ground_truth": 1}, {"key": "40400404", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5317435791052936, "res": {"Yes": 0.5317435791052936, "No": 0.4682347997550491}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5045954045152817, "res": {"Yes": 0.5045954045152817, "No": 0.4953928177066401}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2953009420770891, "res": {"No": 0.7046640461712775, "Yes": 0.2953009420770891}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6542647192019762, "res": {"Yes": 0.6542647192019762, "No": 0.3456938576758292}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7366028911394392, "res": {"Yes": 0.7366028911394392, "No": 0.2633546437053799}, "ground_truth": 1}, {"key": "21713119", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7569910867898032, "res": {"Yes": 0.7569910867898032, "No": 0.24297138494585585}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6861543819507476, "res": {"Yes": 0.6861543819507476, "No": 0.31379226137421246}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5863562963041186, "res": {"Yes": 0.5863562963041186, "No": 0.41361605038530463}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.714907782593412, "res": {"Yes": 0.714907782593412, "No": 0.28505979890599115}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6872467162838983, "res": {"Yes": 0.6872467162838983, "No": 0.3127280862611435}, "ground_truth": 1}, {"key": "28730678", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.44767769781376715, "res": {"No": 0.5523043974715264, "Yes": 0.44767769781376715}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.729764353774828, "res": {"Yes": 0.729764353774828, "No": 0.2702031758024849}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.28005742711586346, "res": {"No": 0.7199157051547102, "Yes": 0.28005742711586346}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.43472265323645487, "res": {"No": 0.5652456859290116, "Yes": 0.43472265323645487}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3626223660975894, "res": {"No": 0.6373440240771222, "Yes": 0.3626223660975894}, "ground_truth": 1}, {"key": "36823733", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4116905516783436, "res": {"No": 0.5882691486578027, "Yes": 0.4116905516783436}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.41589597919525356, "res": {"No": 0.584065876669131, "Yes": 0.41589597919525356}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.68213679641414, "res": {"Yes": 0.68213679641414, "No": 0.3178474907747752}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7907588064707745, "res": {"Yes": 0.7907588064707745, "No": 0.20922191417645422}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7747252721676177, "res": {"Yes": 0.7747252721676177, "No": 0.2252546137289538}, "ground_truth": 1}, {"key": "35988862", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.686959046924659, "res": {"Yes": 0.686959046924659, "No": 0.3130124227288587}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5124029765195227, "res": {"Yes": 0.5124029765195227, "No": 0.4875796096648109}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4084362645452498, "res": {"No": 0.5915492122230169, "Yes": 0.4084362645452498}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3178319166292969, "res": {"No": 0.6821515375495879, "Yes": 0.3178319166292969}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.542371981617556, "res": {"Yes": 0.542371981617556, "No": 0.4576072021848899}, "ground_truth": 1}, {"key": "40499665", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.41780373091202905, "res": {"No": 0.5821745279510664, "Yes": 0.41780373091202905}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.38541891319898103, "res": {"No": 0.6145622827164038, "Yes": 0.38541891319898103}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2499088319072574, "res": {"No": 0.7500779833928277, "Yes": 0.2499088319072574}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6160411473705615, "res": {"Yes": 0.6160411473705615, "No": 0.3839376344004134}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6488261057593844, "res": {"Yes": 0.6488261057593844, "No": 0.3511589180510639}, "ground_truth": 1}, {"key": "32829820", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6825663094084538, "res": {"Yes": 0.6825663094084538, "No": 0.31740830674912857}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.574809188123408, "res": {"Yes": 0.574809188123408, "No": 0.4251680144762095}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.43593817332009216, "res": {"No": 0.5640297108835605, "Yes": 0.43593817332009216}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6958005401249063, "res": {"Yes": 0.6958005401249063, "No": 0.3041502062792908}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6544310020794274, "res": {"Yes": 0.6544310020794274, "No": 0.34554897318060335}, "ground_truth": 1}, {"key": "20583553", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6470425639593687, "res": {"Yes": 0.6470425639593687, "No": 0.35291865065821554}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7112459910802585, "res": {"Yes": 0.7112459910802585, "No": 0.2887176090178365}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6540353741979524, "res": {"Yes": 0.6540353741979524, "No": 0.34593340276790535}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5584716850318883, "res": {"Yes": 0.5584716850318883, "No": 0.44149263978753245}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5306249055044646, "res": {"Yes": 0.5306249055044646, "No": 0.4693380130475374}, "ground_truth": 1}, {"key": "30501550", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5048739423377434, "res": {"Yes": 0.5048739423377434, "No": 0.4950832741284974}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4910869398292926, "res": {"No": 0.5088819880003882, "Yes": 0.4910869398292926}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.46694012571186627, "res": {"No": 0.5330284761877446, "Yes": 0.46694012571186627}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6446464383993572, "res": {"Yes": 0.6446464383993572, "No": 0.3553251120542656}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5625019940117878, "res": {"Yes": 0.5625019940117878, "No": 0.4374707948680364}, "ground_truth": 1}, {"key": "38755897", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6928566537735611, "res": {"Yes": 0.6928566537735611, "No": 0.30711979370436965}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7385968288747373, "res": {"Yes": 0.7385968288747373, "No": 0.26137963192840574}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5351488213611182, "res": {"Yes": 0.5351488213611182, "No": 0.464838056334854}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7485200264770611, "res": {"Yes": 0.7485200264770611, "No": 0.25145792491465047}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7301608402492733, "res": {"Yes": 0.7301608402492733, "No": 0.26981579326147476}, "ground_truth": 1}, {"key": "35507201", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.74121899317532, "res": {"Yes": 0.74121899317532, "No": 0.2587605402413357}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7018769536643623, "res": {"Yes": 0.7018769536643623, "No": 0.2981045843059163}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4568394603807877, "res": {"No": 0.5431439189822475, "Yes": 0.4568394603807877}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4751327216387477, "res": {"No": 0.524848725403496, "Yes": 0.4751327216387477}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6186168377362503, "res": {"Yes": 0.6186168377362503, "No": 0.38136456417642395}, "ground_truth": 1}, {"key": "36453511", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5321975627629761, "res": {"Yes": 0.5321975627629761, "No": 0.46777811908818256}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5377203551083002, "res": {"Yes": 0.5377203551083002, "No": 0.4622601736404178}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.35190332007061476, "res": {"No": 0.6480794254513474, "Yes": 0.35190332007061476}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3106737353347693, "res": {"No": 0.6893045418750664, "Yes": 0.3106737353347693}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.46983415887636665, "res": {"No": 0.5301331911239922, "Yes": 0.46983415887636665}, "ground_truth": 1}, {"key": "38066835", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.34241151671994163, "res": {"No": 0.6575588915788887, "Yes": 0.34241151671994163}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.49907421342020053, "res": {"No": 0.5008947198498698, "Yes": 0.49907421342020053}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5317939376066723, "res": {"Yes": 0.5317939376066723, "No": 0.46818268812190256}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6545630272167745, "res": {"Yes": 0.6545630272167745, "No": 0.3454071544374012}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7941995237064787, "res": {"Yes": 0.7941995237064787, "No": 0.20577572847018813}, "ground_truth": 1}, {"key": "39697181", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.710802475508637, "res": {"Yes": 0.710802475508637, "No": 0.2891722348642297}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6708694642878101, "res": {"Yes": 0.6708694642878101, "No": 0.32910106070181794}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.43873860765406075, "res": {"No": 0.5612397853012384, "Yes": 0.43873860765406075}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.2817353003765113, "res": {"No": 0.7182503312014831, "Yes": 0.2817353003765113}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.268195255083662, "res": {"No": 0.7317845199570769, "Yes": 0.268195255083662}, "ground_truth": 1}, {"key": "21820893", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3255919398241474, "res": {"No": 0.6743855762856505, "Yes": 0.3255919398241474}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.220907238692635, "res": {"No": 0.7790661890755469, "Yes": 0.220907238692635}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.10270302579686393, "res": {"No": 0.8972935310987998, "Yes": 0.10270302579686393}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8323215453881652, "res": {"Yes": 0.8323215453881652, "No": 0.16766626385645228}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6522718017979766, "res": {"Yes": 0.6522718017979766, "No": 0.34771906837983524}, "ground_truth": 1}, {"key": "40519933", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6069344705564528, "res": {"Yes": 0.6069344705564528, "No": 0.3930520630236033}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6940197782237041, "res": {"Yes": 0.6940197782237041, "No": 0.3059681706266271}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.24958688198944937, "res": {"No": 0.7503973595647532, "Yes": 0.24958688198944937}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8405035268575783, "res": {"Yes": 0.8405035268575783, "No": 0.15948029606994818}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7228409262854828, "res": {"Yes": 0.7228409262854828, "No": 0.2771316818540819}, "ground_truth": 1}, {"key": "30446033", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8308248969401746, "res": {"Yes": 0.8308248969401746, "No": 0.1691548857577884}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7507024280703942, "res": {"Yes": 0.7507024280703942, "No": 0.24927389677791761}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5028676624596721, "res": {"Yes": 0.5028676624596721, "No": 0.4971048347592098}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6562408355828145, "res": {"Yes": 0.6562408355828145, "No": 0.3437267392250033}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6394953879191231, "res": {"Yes": 0.6394953879191231, "No": 0.36048028921257214}, "ground_truth": 1}, {"key": "40216291", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5749335557955326, "res": {"Yes": 0.5749335557955326, "No": 0.42504025368071524}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5133125500385909, "res": {"Yes": 0.5133125500385909, "No": 0.4866568618667301}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.44371263702096425, "res": {"No": 0.5562633420953212, "Yes": 0.44371263702096425}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7533351077246391, "res": {"Yes": 0.7533351077246391, "No": 0.24663422755805336}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7366616817621896, "res": {"Yes": 0.7366616817621896, "No": 0.2633073757892572}, "ground_truth": 1}, {"key": "33479118", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.719120155845541, "res": {"Yes": 0.719120155845541, "No": 0.2808492585580165}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5975203363640156, "res": {"Yes": 0.5975203363640156, "No": 0.4024406083119768}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2389218184552404, "res": {"No": 0.7610449163981584, "Yes": 0.2389218184552404}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4815275896541201, "res": {"No": 0.5184357365883249, "Yes": 0.4815275896541201}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.42595426399095815, "res": {"No": 0.5740112175979261, "Yes": 0.42595426399095815}, "ground_truth": 1}, {"key": "22297373", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4549550527843935, "res": {"No": 0.5450034467646959, "Yes": 0.4549550527843935}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.43790647009683636, "res": {"No": 0.5620525096006305, "Yes": 0.43790647009683636}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4360843460935398, "res": {"No": 0.563876738572291, "Yes": 0.4360843460935398}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4519381702450354, "res": {"No": 0.5480250946092607, "Yes": 0.4519381702450354}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6027522976396755, "res": {"Yes": 0.6027522976396755, "No": 0.39721054453333793}, "ground_truth": 1}, {"key": "36463668", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7545648375548899, "res": {"Yes": 0.7545648375548899, "No": 0.24540111576402351}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6067083385626606, "res": {"Yes": 0.6067083385626606, "No": 0.39326549319264564}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5283224399196715, "res": {"Yes": 0.5283224399196715, "No": 0.4716596660405086}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7346871622258453, "res": {"Yes": 0.7346871622258453, "No": 0.26529146220992195}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.797041333644738, "res": {"Yes": 0.797041333644738, "No": 0.20293340661313553}, "ground_truth": 1}, {"key": "35264615", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8438045137445768, "res": {"Yes": 0.8438045137445768, "No": 0.15616497476175648}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7529032541357433, "res": {"Yes": 0.7529032541357433, "No": 0.24707320740816957}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2943076294563711, "res": {"No": 0.7056720272947153, "Yes": 0.2943076294563711}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4531257944979268, "res": {"No": 0.5468493313127223, "Yes": 0.4531257944979268}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4886974464055075, "res": {"No": 0.5112760087798943, "Yes": 0.4886974464055075}, "ground_truth": 1}, {"key": "39898482", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.49237187721554204, "res": {"No": 0.5076062654174981, "Yes": 0.49237187721554204}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5558826100649322, "res": {"Yes": 0.5558826100649322, "No": 0.44409960771957335}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7634516065696954, "res": {"Yes": 0.7634516065696954, "No": 0.2365179914876673}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5508107694171848, "res": {"Yes": 0.5508107694171848, "No": 0.449172085835494}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6888825134481765, "res": {"Yes": 0.6888825134481765, "No": 0.3111012366493935}, "ground_truth": 1}, {"key": "37228721", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7744498288375614, "res": {"Yes": 0.7744498288375614, "No": 0.22552826143971097}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6666761121390217, "res": {"Yes": 0.6666761121390217, "No": 0.333301031121287}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.23145738603564842, "res": {"No": 0.7684837586953018, "Yes": 0.23145738603564842}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5505668252977205, "res": {"Yes": 0.5505668252977205, "No": 0.449384401251094}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6515589128683119, "res": {"Yes": 0.6515589128683119, "No": 0.34839736401689214}, "ground_truth": 1}, {"key": "24535799", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.49731224032555277, "res": {"No": 0.502632445823632, "Yes": 0.49731224032555277}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6151084040258937, "res": {"Yes": 0.6151084040258937, "No": 0.38484791065571833}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5046303489569818, "res": {"Yes": 0.5046303489569818, "No": 0.4953534157289572}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6136318950998194, "res": {"Yes": 0.6136318950998194, "No": 0.3863342699264232}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.714685831038711, "res": {"Yes": 0.714685831038711, "No": 0.28528400104220225}, "ground_truth": 1}, {"key": "35177759", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5234625442195755, "res": {"Yes": 0.5234625442195755, "No": 0.47651262069270933}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6101324769903047, "res": {"Yes": 0.6101324769903047, "No": 0.3898462571564291}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5402364850563236, "res": {"Yes": 0.5402364850563236, "No": 0.459744122362642}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6826317706563427, "res": {"Yes": 0.6826317706563427, "No": 0.3173370248486898}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6171041923788128, "res": {"Yes": 0.6171041923788128, "No": 0.3828611454705268}, "ground_truth": 1}, {"key": "34364829", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6646783563475122, "res": {"Yes": 0.6646783563475122, "No": 0.3352907544009595}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6026569799012527, "res": {"Yes": 0.6026569799012527, "No": 0.3973121401484745}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.624801112430312, "res": {"Yes": 0.624801112430312, "No": 0.3751687553391621}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6508709824858587, "res": {"Yes": 0.6508709824858587, "No": 0.3491031994711787}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6573187949160032, "res": {"Yes": 0.6573187949160032, "No": 0.34265355019801347}, "ground_truth": 1}, {"key": "38090732", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7087865752363042, "res": {"Yes": 0.7087865752363042, "No": 0.2911851674242465}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6784520993922626, "res": {"Yes": 0.6784520993922626, "No": 0.3215220027032571}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3773282049882561, "res": {"No": 0.6226551155982114, "Yes": 0.3773282049882561}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6354171097393839, "res": {"Yes": 0.6354171097393839, "No": 0.3645651884645056}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7080582957840666, "res": {"Yes": 0.7080582957840666, "No": 0.291923674377528}, "ground_truth": 1}, {"key": "30651479", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6994291686326166, "res": {"Yes": 0.6994291686326166, "No": 0.30055347122135856}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7211989092961503, "res": {"Yes": 0.7211989092961503, "No": 0.27878296586709744}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2741804534870713, "res": {"No": 0.7257943273168269, "Yes": 0.2741804534870713}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.36384679238132167, "res": {"No": 0.6361154162594705, "Yes": 0.36384679238132167}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5590403645145733, "res": {"Yes": 0.5590403645145733, "No": 0.4409166912989203}, "ground_truth": 1}, {"key": "39380921", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6060220545064819, "res": {"Yes": 0.6060220545064819, "No": 0.3939363621954318}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6852625907616002, "res": {"Yes": 0.6852625907616002, "No": 0.3146937925759571}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.48662119122610015, "res": {"No": 0.5133601003823611, "Yes": 0.48662119122610015}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7482050855836294, "res": {"Yes": 0.7482050855836294, "No": 0.2517705303908759}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8093812274314782, "res": {"Yes": 0.8093812274314782, "No": 0.19059245005698}, "ground_truth": 1}, {"key": "39037490", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8142048387343532, "res": {"Yes": 0.8142048387343532, "No": 0.1857606986507214}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7548721740205697, "res": {"Yes": 0.7548721740205697, "No": 0.2450968108893697}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6844912619023864, "res": {"Yes": 0.6844912619023864, "No": 0.31549403616014166}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7606673643719237, "res": {"Yes": 0.7606673643719237, "No": 0.23931078886062782}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7202141648653494, "res": {"Yes": 0.7202141648653494, "No": 0.279763409239643}, "ground_truth": 1}, {"key": "35917499", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6390296915721391, "res": {"Yes": 0.6390296915721391, "No": 0.36095022898565793}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7626740456171885, "res": {"Yes": 0.7626740456171885, "No": 0.23730278011402672}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.567435552472818, "res": {"Yes": 0.567435552472818, "No": 0.43253769514650414}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8065143972962142, "res": {"Yes": 0.8065143972962142, "No": 0.19346232273876146}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6537532580385825, "res": {"Yes": 0.6537532580385825, "No": 0.34620389000815227}, "ground_truth": 1}, {"key": "34908073", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7245851824591387, "res": {"Yes": 0.7245851824591387, "No": 0.275389477907172}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6992775837889164, "res": {"Yes": 0.6992775837889164, "No": 0.3006958771268519}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.10612449424666527, "res": {"No": 0.8938629011383428, "Yes": 0.10612449424666527}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.42154584126681466, "res": {"No": 0.5784101846364434, "Yes": 0.42154584126681466}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.31138727009811284, "res": {"No": 0.6885893598885189, "Yes": 0.31138727009811284}, "ground_truth": 1}, {"key": "36344759", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4092399336914202, "res": {"No": 0.5907369817355499, "Yes": 0.4092399336914202}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.2823130831360746, "res": {"No": 0.7176603155499387, "Yes": 0.2823130831360746}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5731462610229597, "res": {"Yes": 0.5731462610229597, "No": 0.4268312853964659}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.47004492675778703, "res": {"No": 0.5299321762311168, "Yes": 0.47004492675778703}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7695974908238312, "res": {"Yes": 0.7695974908238312, "No": 0.2303850130044125}, "ground_truth": 1}, {"key": "39984637", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7368395628315729, "res": {"Yes": 0.7368395628315729, "No": 0.2631469914712332}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6858759009680477, "res": {"Yes": 0.6858759009680477, "No": 0.3141103254023398}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4823423246018529, "res": {"No": 0.5176219134715818, "Yes": 0.4823423246018529}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5013432614060546, "res": {"Yes": 0.5013432614060546, "No": 0.49859970477537746}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.52369640622409, "res": {"Yes": 0.52369640622409, "No": 0.47625745458110047}, "ground_truth": 1}, {"key": "17917326", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.53320282099675, "res": {"Yes": 0.53320282099675, "No": 0.4667491115703679}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4388923773773747, "res": {"No": 0.56106502560902, "Yes": 0.4388923773773747}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5482212953048008, "res": {"Yes": 0.5482212953048008, "No": 0.4517534556792689}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6996044535542232, "res": {"Yes": 0.6996044535542232, "No": 0.30037030965861844}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6085574491001899, "res": {"Yes": 0.6085574491001899, "No": 0.3914167460237197}, "ground_truth": 1}, {"key": "32193638", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7412394955762182, "res": {"Yes": 0.7412394955762182, "No": 0.25874154791470894}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5748495871327539, "res": {"Yes": 0.5748495871327539, "No": 0.4251257208658485}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.65158347710236, "res": {"Yes": 0.65158347710236, "No": 0.34839252132718906}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6572332898757685, "res": {"Yes": 0.6572332898757685, "No": 0.3427501578500231}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.502528929279783, "res": {"Yes": 0.502528929279783, "No": 0.49745455663638916}, "ground_truth": 1}, {"key": "34564692", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5676081018078124, "res": {"Yes": 0.5676081018078124, "No": 0.4323714163718633}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.39285413255243223, "res": {"No": 0.6071277310463826, "Yes": 0.39285413255243223}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.718391567466086, "res": {"Yes": 0.718391567466086, "No": 0.28153339672068406}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7291079342331372, "res": {"Yes": 0.7291079342331372, "No": 0.27084569809063236}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7189910278427047, "res": {"Yes": 0.7189910278427047, "No": 0.2809520401044601}, "ground_truth": 1}, {"key": "39329284", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6883902348707088, "res": {"Yes": 0.6883902348707088, "No": 0.31157643302075105}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.21711988772631693, "res": {"No": 0.7827949771487717, "Yes": 0.21711988772631693}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4828416142088632, "res": {"No": 0.5171397663017843, "Yes": 0.4828416142088632}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5868126942134752, "res": {"Yes": 0.5868126942134752, "No": 0.4131657809105876}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7581807009469272, "res": {"Yes": 0.7581807009469272, "No": 0.24179768859683695}, "ground_truth": 1}, {"key": "37438541", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7441678237720131, "res": {"Yes": 0.7441678237720131, "No": 0.2558154993499524}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6301801172887332, "res": {"Yes": 0.6301801172887332, "No": 0.3698036832371084}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3662347345240225, "res": {"No": 0.633751073622046, "Yes": 0.3662347345240225}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.617818885506501, "res": {"Yes": 0.617818885506501, "No": 0.38214678127616836}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6163448688981218, "res": {"Yes": 0.6163448688981218, "No": 0.38363269791268617}, "ground_truth": 1}, {"key": "34652757", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5688454492161619, "res": {"Yes": 0.5688454492161619, "No": 0.43112601647544585}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6640204047052986, "res": {"Yes": 0.6640204047052986, "No": 0.33594994611899215}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6335154761005014, "res": {"Yes": 0.6335154761005014, "No": 0.36646187046429296}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7315349800851536, "res": {"Yes": 0.7315349800851536, "No": 0.26845072538336484}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6767859705484865, "res": {"Yes": 0.6767859705484865, "No": 0.323194296325064}, "ground_truth": 1}, {"key": "31361004", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7116636079210263, "res": {"Yes": 0.7116636079210263, "No": 0.288324527974918}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6349164649518501, "res": {"Yes": 0.6349164649518501, "No": 0.3650632327474715}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.47365536490317334, "res": {"No": 0.5263276560139798, "Yes": 0.47365536490317334}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4484946169035593, "res": {"No": 0.551484210940171, "Yes": 0.4484946169035593}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.532806441460912, "res": {"Yes": 0.532806441460912, "No": 0.4671677864877199}, "ground_truth": 1}, {"key": "26150727", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6195141110777761, "res": {"Yes": 0.6195141110777761, "No": 0.3804555988802093}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.657381893975518, "res": {"Yes": 0.657381893975518, "No": 0.34257930521841967}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6192395413352152, "res": {"Yes": 0.6192395413352152, "No": 0.38074641609588145}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.40255166101978795, "res": {"No": 0.5974242150245092, "Yes": 0.40255166101978795}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5629389633231298, "res": {"Yes": 0.5629389633231298, "No": 0.4370297099683091}, "ground_truth": 1}, {"key": "36997402", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5583355238976502, "res": {"Yes": 0.5583355238976502, "No": 0.4416351015378886}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4879924229457712, "res": {"No": 0.5119875093709878, "Yes": 0.4879924229457712}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3339957869523876, "res": {"No": 0.6659882175264296, "Yes": 0.3339957869523876}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8123380806435463, "res": {"Yes": 0.8123380806435463, "No": 0.1876461257057134}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6931221449391012, "res": {"Yes": 0.6931221449391012, "No": 0.3068573798763597}, "ground_truth": 1}, {"key": "37430643", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5469130757857358, "res": {"Yes": 0.5469130757857358, "No": 0.4530610927542869}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7008227058392821, "res": {"Yes": 0.7008227058392821, "No": 0.29915145361708634}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6431000616355556, "res": {"Yes": 0.6431000616355556, "No": 0.35687631993027435}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7399582598373362, "res": {"Yes": 0.7399582598373362, "No": 0.2600194351976801}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7091615516097075, "res": {"Yes": 0.7091615516097075, "No": 0.2908145791357095}, "ground_truth": 1}, {"key": "36964631", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7190829782945318, "res": {"Yes": 0.7190829782945318, "No": 0.28089152955224206}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7773999226984686, "res": {"Yes": 0.7773999226984686, "No": 0.2225729646772047}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6025198609067814, "res": {"Yes": 0.6025198609067814, "No": 0.3974642444511021}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5200704114181194, "res": {"Yes": 0.5200704114181194, "No": 0.47991158018331315}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7912782525000502, "res": {"Yes": 0.7912782525000502, "No": 0.20870032659467308}, "ground_truth": 1}, {"key": "35502013", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6679310562356494, "res": {"Yes": 0.6679310562356494, "No": 0.33204721709908913}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.47219865627688, "res": {"No": 0.5277854091247196, "Yes": 0.47219865627688}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5840005233541179, "res": {"Yes": 0.5840005233541179, "No": 0.4159811218162448}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5468923481729543, "res": {"Yes": 0.5468923481729543, "No": 0.45308970899659673}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6866576342211529, "res": {"Yes": 0.6866576342211529, "No": 0.3133259990335147}, "ground_truth": 1}, {"key": "33987664", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5803219170598456, "res": {"Yes": 0.5803219170598456, "No": 0.4196605956471888}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.49288384560070925, "res": {"No": 0.5070971380275443, "Yes": 0.49288384560070925}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5599844519574924, "res": {"Yes": 0.5599844519574924, "No": 0.43998726309507974}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7443880928321649, "res": {"Yes": 0.7443880928321649, "No": 0.255588333782216}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8067451418065186, "res": {"Yes": 0.8067451418065186, "No": 0.19323366942524337}, "ground_truth": 1}, {"key": "35203721", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7137783136050744, "res": {"Yes": 0.7137783136050744, "No": 0.28619459426532323}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7112969536812328, "res": {"Yes": 0.7112969536812328, "No": 0.28867823062163417}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5646434550738861, "res": {"Yes": 0.5646434550738861, "No": 0.43533425528928116}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7303398538184487, "res": {"Yes": 0.7303398538184487, "No": 0.269641144084111}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7376381915119492, "res": {"Yes": 0.7376381915119492, "No": 0.26234112979460117}, "ground_truth": 1}, {"key": "39028348", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.758351970563456, "res": {"Yes": 0.758351970563456, "No": 0.24163467520993973}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.705923467739609, "res": {"Yes": 0.705923467739609, "No": 0.2940577801002212}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.44303932195415324, "res": {"No": 0.5569362154859543, "Yes": 0.44303932195415324}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5361129030897647, "res": {"Yes": 0.5361129030897647, "No": 0.46385554530555967}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4253393321687272, "res": {"No": 0.5746362195797625, "Yes": 0.4253393321687272}, "ground_truth": 1}, {"key": "37459383", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4801181593794839, "res": {"No": 0.5198538315987788, "Yes": 0.4801181593794839}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5254383354918034, "res": {"Yes": 0.5254383354918034, "No": 0.474530113167802}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4916966586955913, "res": {"No": 0.5082791370154016, "Yes": 0.4916966586955913}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4748058477899084, "res": {"No": 0.5251723418861882, "Yes": 0.4748058477899084}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7023444259654786, "res": {"Yes": 0.7023444259654786, "No": 0.2976160636980278}, "ground_truth": 1}, {"key": "34020070", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6945346333476041, "res": {"Yes": 0.6945346333476041, "No": 0.30543979199686627}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5492151389551583, "res": {"Yes": 0.5492151389551583, "No": 0.4507581211902528}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.48187655870649765, "res": {"No": 0.5181053909421652, "Yes": 0.48187655870649765}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6883061875542242, "res": {"Yes": 0.6883061875542242, "No": 0.31166970180413134}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6170569240080783, "res": {"Yes": 0.6170569240080783, "No": 0.38292384411640906}, "ground_truth": 1}, {"key": "35176615", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6726706601234025, "res": {"Yes": 0.6726706601234025, "No": 0.3273092946255396}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5821310993511881, "res": {"Yes": 0.5821310993511881, "No": 0.4178490650761669}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.49897186379534086, "res": {"No": 0.5010088567048171, "Yes": 0.49897186379534086}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.564702632808837, "res": {"Yes": 0.564702632808837, "No": 0.4352769168375678}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7091672391081583, "res": {"Yes": 0.7091672391081583, "No": 0.29081245619703056}, "ground_truth": 1}, {"key": "33296389", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6651104512585043, "res": {"Yes": 0.6651104512585043, "No": 0.3348662100207914}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5236901428525266, "res": {"Yes": 0.5236901428525266, "No": 0.47628718826211713}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.8047151621634822, "res": {"Yes": 0.8047151621634822, "No": 0.19526364655059716}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7078436096592989, "res": {"Yes": 0.7078436096592989, "No": 0.29214039133916636}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7450256586907681, "res": {"Yes": 0.7450256586907681, "No": 0.25496163401151045}, "ground_truth": 1}, {"key": "35399504", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7173294356189782, "res": {"Yes": 0.7173294356189782, "No": 0.28265104463699603}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6895188592887003, "res": {"Yes": 0.6895188592887003, "No": 0.31045696073064355}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5421696929067695, "res": {"Yes": 0.5421696929067695, "No": 0.4578083372839853}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.641612480800371, "res": {"Yes": 0.641612480800371, "No": 0.3583638743414821}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.714945137500941, "res": {"Yes": 0.714945137500941, "No": 0.28502901411011816}, "ground_truth": 1}, {"key": "34807886", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7254394281090125, "res": {"Yes": 0.7254394281090125, "No": 0.27453816310255374}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5677411817734779, "res": {"Yes": 0.5677411817734779, "No": 0.43223694383468464}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.43482786450083505, "res": {"No": 0.5651603967902322, "Yes": 0.43482786450083505}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6946002560797319, "res": {"Yes": 0.6946002560797319, "No": 0.30537721379484184}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7360501382140945, "res": {"Yes": 0.7360501382140945, "No": 0.2639241045320701}, "ground_truth": 1}, {"key": "37629813", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7270824766111897, "res": {"Yes": 0.7270824766111897, "No": 0.2729015149451996}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.71343327807345, "res": {"Yes": 0.71343327807345, "No": 0.2865378900753238}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.33576337774808573, "res": {"No": 0.6642240511436737, "Yes": 0.33576337774808573}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4725610897166572, "res": {"No": 0.5274213628028481, "Yes": 0.4725610897166572}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4975739451306007, "res": {"No": 0.502407035572524, "Yes": 0.4975739451306007}, "ground_truth": 1}, {"key": "28084389", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5884533645657429, "res": {"Yes": 0.5884533645657429, "No": 0.41152895369151515}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5637533983884021, "res": {"Yes": 0.5637533983884021, "No": 0.4362268817469004}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4894341945808022, "res": {"No": 0.5105488783129725, "Yes": 0.4894341945808022}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.2684047973935033, "res": {"No": 0.7315744840406755, "Yes": 0.2684047973935033}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4269261933461994, "res": {"No": 0.5730419235128097, "Yes": 0.4269261933461994}, "ground_truth": 1}, {"key": "35391734", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3040671237925197, "res": {"No": 0.695907694700235, "Yes": 0.3040671237925197}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.47548191089601116, "res": {"No": 0.5244816434221958, "Yes": 0.47548191089601116}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5555090602246977, "res": {"Yes": 0.5555090602246977, "No": 0.44446614107015986}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.727602883002964, "res": {"Yes": 0.727602883002964, "No": 0.27237221789897265}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4953137395094111, "res": {"No": 0.5046582557868958, "Yes": 0.4953137395094111}, "ground_truth": 1}, {"key": "40214591", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6003607826862539, "res": {"Yes": 0.6003607826862539, "No": 0.3996131039810654}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6116052872603477, "res": {"Yes": 0.6116052872603477, "No": 0.3883582851925136}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4878018015464414, "res": {"No": 0.5121751923047825, "Yes": 0.4878018015464414}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6912191406244866, "res": {"Yes": 0.6912191406244866, "No": 0.30875521515262916}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.658120390570438, "res": {"Yes": 0.658120390570438, "No": 0.34185647286192533}, "ground_truth": 1}, {"key": "26283171", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6834362001790069, "res": {"Yes": 0.6834362001790069, "No": 0.31653574670496926}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6934562687329766, "res": {"Yes": 0.6934562687329766, "No": 0.3065225664659016}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7364799476459997, "res": {"Yes": 0.7364799476459997, "No": 0.2635021109071449}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7619109680128124, "res": {"Yes": 0.7619109680128124, "No": 0.2380653888448579}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7302779236247222, "res": {"Yes": 0.7302779236247222, "No": 0.269700579541814}, "ground_truth": 1}, {"key": "37084030", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7932872031224424, "res": {"Yes": 0.7932872031224424, "No": 0.20668609209917607}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7333418241386368, "res": {"Yes": 0.7333418241386368, "No": 0.26663630572376673}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6578160473761782, "res": {"Yes": 0.6578160473761782, "No": 0.3421633925549403}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7525459658790653, "res": {"Yes": 0.7525459658790653, "No": 0.24743830519158533}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.612913354311282, "res": {"Yes": 0.612913354311282, "No": 0.3870672068184886}, "ground_truth": 1}, {"key": "39027295", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6585428551249541, "res": {"Yes": 0.6585428551249541, "No": 0.34143908182426}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6311376275510289, "res": {"Yes": 0.6311376275510289, "No": 0.3688428708076739}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5221665660232289, "res": {"Yes": 0.5221665660232289, "No": 0.4778153443587902}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7008102803628597, "res": {"Yes": 0.7008102803628597, "No": 0.2991581247688851}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7098100357697087, "res": {"Yes": 0.7098100357697087, "No": 0.2901619974704886}, "ground_truth": 1}, {"key": "14018647", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7509932464510863, "res": {"Yes": 0.7509932464510863, "No": 0.24897457404507928}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6496727268782968, "res": {"Yes": 0.6496727268782968, "No": 0.3502917150751519}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.43711891683536475, "res": {"No": 0.5628595213531905, "Yes": 0.43711891683536475}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.24089300662065152, "res": {"No": 0.7590657865850315, "Yes": 0.24089300662065152}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.2988900496926373, "res": {"No": 0.7010842876621638, "Yes": 0.2988900496926373}, "ground_truth": 1}, {"key": "37424289", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.30773138597108396, "res": {"No": 0.6922438230330891, "Yes": 0.30773138597108396}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3784670893814778, "res": {"No": 0.6215042560660701, "Yes": 0.3784670893814778}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5629067191027939, "res": {"Yes": 0.5629067191027939, "No": 0.437069700016288}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6401021922401122, "res": {"Yes": 0.6401021922401122, "No": 0.3598484530183675}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.698888963407131, "res": {"Yes": 0.698888963407131, "No": 0.30107210241864474}, "ground_truth": 1}, {"key": "37498031", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7821601218485871, "res": {"Yes": 0.7821601218485871, "No": 0.2178086835287561}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.526123869827578, "res": {"Yes": 0.526123869827578, "No": 0.47384420156427004}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.04383504356945117, "res": {"No": 0.9561337259617527, "Yes": 0.04383504356945117}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.43298300550769797, "res": {"No": 0.5669968107782056, "Yes": 0.43298300550769797}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.42482079406723333, "res": {"No": 0.5751509792742974, "Yes": 0.42482079406723333}, "ground_truth": 1}, {"key": "30104095", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6101483467424165, "res": {"Yes": 0.6101483467424165, "No": 0.3898214637229135}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.48932977025379026, "res": {"No": 0.5106463769296705, "Yes": 0.48932977025379026}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5886193906767688, "res": {"Yes": 0.5886193906767688, "No": 0.4113593564132039}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.483579573284202, "res": {"No": 0.5163972734201812, "Yes": 0.483579573284202}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4938984745603777, "res": {"No": 0.5060807993159332, "Yes": 0.4938984745603777}, "ground_truth": 1}, {"key": "37911407", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5271024431779286, "res": {"Yes": 0.5271024431779286, "No": 0.47286842520539474}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.461595090350765, "res": {"No": 0.5383793800257, "Yes": 0.461595090350765}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7516891987489961, "res": {"Yes": 0.7516891987489961, "No": 0.2482877309231401}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5965489791011921, "res": {"Yes": 0.5965489791011921, "No": 0.4034197079679785}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7318728077669782, "res": {"Yes": 0.7318728077669782, "No": 0.26810025033587076}, "ground_truth": 1}, {"key": "39177472", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8109905071924707, "res": {"Yes": 0.8109905071924707, "No": 0.18898103743268221}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7556454985806711, "res": {"Yes": 0.7556454985806711, "No": 0.24432939123337324}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4891191786897609, "res": {"No": 0.5108610007340965, "Yes": 0.4891191786897609}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5664080636691274, "res": {"Yes": 0.5664080636691274, "No": 0.4335774485547337}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5681923347848602, "res": {"Yes": 0.5681923347848602, "No": 0.43178495673928585}, "ground_truth": 1}, {"key": "32325454", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6500305481779122, "res": {"Yes": 0.6500305481779122, "No": 0.3499475825000638}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5268793626621446, "res": {"Yes": 0.5268793626621446, "No": 0.4731048523017193}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5379170838154985, "res": {"Yes": 0.5379170838154985, "No": 0.46205899557641444}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6844936850057425, "res": {"Yes": 0.6844936850057425, "No": 0.3154836881254643}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7021175772646896, "res": {"Yes": 0.7021175772646896, "No": 0.2978583324427303}, "ground_truth": 1}, {"key": "38395319", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7269705581493252, "res": {"Yes": 0.7269705581493252, "No": 0.2730057559373077}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.673309819095624, "res": {"Yes": 0.673309819095624, "No": 0.32666807002498655}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5931266071443209, "res": {"Yes": 0.5931266071443209, "No": 0.4068549277317306}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7310251170303526, "res": {"Yes": 0.7310251170303526, "No": 0.26895629088477546}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5371110332595082, "res": {"Yes": 0.5371110332595082, "No": 0.46287383806873067}, "ground_truth": 1}, {"key": "38235895", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6819603027119545, "res": {"Yes": 0.6819603027119545, "No": 0.31800896651863364}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.44246863429306216, "res": {"No": 0.5575114320158938, "Yes": 0.44246863429306216}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7289796225284735, "res": {"Yes": 0.7289796225284735, "No": 0.2710067637301648}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5664690124557642, "res": {"Yes": 0.5664690124557642, "No": 0.4335099804820165}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7115611784333292, "res": {"Yes": 0.7115611784333292, "No": 0.288415018409003}, "ground_truth": 1}, {"key": "26543267", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8085338040633512, "res": {"Yes": 0.8085338040633512, "No": 0.1914467455803746}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7115243632103752, "res": {"Yes": 0.7115243632103752, "No": 0.28845620701442826}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.1822717087428344, "res": {"No": 0.8176879208728935, "Yes": 0.1822717087428344}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5698516358595699, "res": {"Yes": 0.5698516358595699, "No": 0.43007849088951966}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5347683855662984, "res": {"Yes": 0.5347683855662984, "No": 0.46518676912681933}, "ground_truth": 1}, {"key": "39054728", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5228352364603329, "res": {"Yes": 0.5228352364603329, "No": 0.4771040727624856}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.26833316971221827, "res": {"No": 0.7316373216716331, "Yes": 0.26833316971221827}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.40264463703591125, "res": {"No": 0.5973251941936999, "Yes": 0.40264463703591125}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.37567113472623737, "res": {"No": 0.6243050736533006, "Yes": 0.37567113472623737}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5001941779752996, "res": {"Yes": 0.5001941779752996, "No": 0.49977647026041383}, "ground_truth": 1}, {"key": "39158443", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5941148073074293, "res": {"Yes": 0.5941148073074293, "No": 0.4058618939230439}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.25227959564258134, "res": {"No": 0.7477015110854819, "Yes": 0.25227959564258134}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6091974401232989, "res": {"Yes": 0.6091974401232989, "No": 0.39077527049478394}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6958181023521735, "res": {"Yes": 0.6958181023521735, "No": 0.3041451270132579}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6338543390967647, "res": {"Yes": 0.6338543390967647, "No": 0.3661051103728294}, "ground_truth": 1}, {"key": "36254201", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7273750843793622, "res": {"Yes": 0.7273750843793622, "No": 0.27259767192953277}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6200084202418372, "res": {"Yes": 0.6200084202418372, "No": 0.3799618598936127}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.11388898737387525, "res": {"No": 0.8860979370985822, "Yes": 0.11388898737387525}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7072052104274293, "res": {"Yes": 0.7072052104274293, "No": 0.29277291634353075}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7489300807169151, "res": {"Yes": 0.7489300807169151, "No": 0.25105254980263064}, "ground_truth": 1}, {"key": "23434347", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6503997403268998, "res": {"Yes": 0.6503997403268998, "No": 0.3495751216714256}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7624683039154847, "res": {"Yes": 0.7624683039154847, "No": 0.23750861083911148}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5582511322783371, "res": {"Yes": 0.5582511322783371, "No": 0.44173093350182396}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6945293896309175, "res": {"Yes": 0.6945293896309175, "No": 0.30545087966255563}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.516244907067556, "res": {"Yes": 0.516244907067556, "No": 0.4837357463411985}, "ground_truth": 1}, {"key": "34397620", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6630842784880852, "res": {"Yes": 0.6630842784880852, "No": 0.33689280004204525}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4864463796388749, "res": {"No": 0.513531113709119, "Yes": 0.4864463796388749}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.37365113911330766, "res": {"No": 0.6263246387826521, "Yes": 0.37365113911330766}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5785980075596737, "res": {"Yes": 0.5785980075596737, "No": 0.421385241824152}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7755001290164898, "res": {"Yes": 0.7755001290164898, "No": 0.22447833046493884}, "ground_truth": 1}, {"key": "34340916", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7155086719022709, "res": {"Yes": 0.7155086719022709, "No": 0.284473976671036}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6593509215928838, "res": {"Yes": 0.6593509215928838, "No": 0.34062725275290096}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5555013720325067, "res": {"Yes": 0.5555013720325067, "No": 0.44447780845949675}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.502433894970591, "res": {"Yes": 0.502433894970591, "No": 0.49754645492955607}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6471476263187846, "res": {"Yes": 0.6471476263187846, "No": 0.3528258452575376}, "ground_truth": 1}, {"key": "30375089", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5762549815133561, "res": {"Yes": 0.5762549815133561, "No": 0.42372865213457256}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6922840297219218, "res": {"Yes": 0.6922840297219218, "No": 0.30768821428619675}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5065787948844284, "res": {"Yes": 0.5065787948844284, "No": 0.493404773612279}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5712087553960037, "res": {"Yes": 0.5712087553960037, "No": 0.428769731744256}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5526848507796117, "res": {"Yes": 0.5526848507796117, "No": 0.44729108474828083}, "ground_truth": 1}, {"key": "35807797", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5996746624952352, "res": {"Yes": 0.5996746624952352, "No": 0.4003084516165578}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6240340280301069, "res": {"Yes": 0.6240340280301069, "No": 0.375940177742101}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6705188052813085, "res": {"Yes": 0.6705188052813085, "No": 0.3294621179283266}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7177624602344911, "res": {"Yes": 0.7177624602344911, "No": 0.282218128987091}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6512691639088138, "res": {"Yes": 0.6512691639088138, "No": 0.34870632034957433}, "ground_truth": 1}, {"key": "34188172", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6035724173708235, "res": {"Yes": 0.6035724173708235, "No": 0.39640893357969254}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6529381962827422, "res": {"Yes": 0.6529381962827422, "No": 0.34703883113778433}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7295627623282918, "res": {"Yes": 0.7295627623282918, "No": 0.27042083101587033}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.44245721874955857, "res": {"No": 0.5575193877607927, "Yes": 0.44245721874955857}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3489054885155939, "res": {"No": 0.6510770743517945, "Yes": 0.3489054885155939}, "ground_truth": 1}, {"key": "37075567", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.46463013430407635, "res": {"No": 0.5353411884138042, "Yes": 0.46463013430407635}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.28590042303335467, "res": {"No": 0.7140803771065882, "Yes": 0.28590042303335467}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5548654650144526, "res": {"Yes": 0.5548654650144526, "No": 0.4451170489741532}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5738354191476498, "res": {"Yes": 0.5738354191476498, "No": 0.4261398713930626}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7178169835417395, "res": {"Yes": 0.7178169835417395, "No": 0.2821518719492854}, "ground_truth": 1}, {"key": "35559735", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6519749096029549, "res": {"Yes": 0.6519749096029549, "No": 0.3479953017559817}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.46312538575169393, "res": {"No": 0.5368527664499326, "Yes": 0.46312538575169393}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4278479771804995, "res": {"No": 0.572138508035478, "Yes": 0.4278479771804995}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6848501662824952, "res": {"Yes": 0.6848501662824952, "No": 0.31513549178066397}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7842267566734215, "res": {"Yes": 0.7842267566734215, "No": 0.2157588565075371}, "ground_truth": 1}, {"key": "33005019", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7391329418233766, "res": {"Yes": 0.7391329418233766, "No": 0.260849439046261}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7218794216942517, "res": {"Yes": 0.7218794216942517, "No": 0.27809758547459257}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.142942475340615, "res": {"No": 0.8570318813223892, "Yes": 0.142942475340615}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.44833592274122547, "res": {"No": 0.5516456650276648, "Yes": 0.44833592274122547}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5464178515760546, "res": {"Yes": 0.5464178515760546, "No": 0.45353923372213883}, "ground_truth": 1}, {"key": "30808252", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.42004240857689595, "res": {"No": 0.5799333475862427, "Yes": 0.42004240857689595}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4174882578487138, "res": {"No": 0.5824843854476652, "Yes": 0.4174882578487138}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7919914204432978, "res": {"Yes": 0.7919914204432978, "No": 0.20799151362353668}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6733130375242514, "res": {"Yes": 0.6733130375242514, "No": 0.3266634640376715}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6779906918301966, "res": {"Yes": 0.6779906918301966, "No": 0.32199044750864414}, "ground_truth": 1}, {"key": "15159017", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5575443651888546, "res": {"Yes": 0.5575443651888546, "No": 0.4424323091093559}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.624344861883483, "res": {"Yes": 0.624344861883483, "No": 0.37563416674890815}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5380721284799711, "res": {"Yes": 0.5380721284799711, "No": 0.46190926652085224}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.49710908005262605, "res": {"No": 0.5028700460580413, "Yes": 0.49710908005262605}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5172321098507825, "res": {"Yes": 0.5172321098507825, "No": 0.4827464072302578}, "ground_truth": 1}, {"key": "24493400", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.46118443042164325, "res": {"No": 0.5387937146361272, "Yes": 0.46118443042164325}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4362667852447324, "res": {"No": 0.5637103630966471, "Yes": 0.4362667852447324}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.41511964462532375, "res": {"No": 0.5848589920708643, "Yes": 0.41511964462532375}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.48110771222794874, "res": {"No": 0.5188716131110146, "Yes": 0.48110771222794874}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5266315768937302, "res": {"Yes": 0.5266315768937302, "No": 0.4733389741062824}, "ground_truth": 1}, {"key": "37791071", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5342488699464488, "res": {"Yes": 0.5342488699464488, "No": 0.4657269037975104}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5632442884879637, "res": {"Yes": 0.5632442884879637, "No": 0.43673162630000517}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5312079047503522, "res": {"Yes": 0.5312079047503522, "No": 0.4687687652338104}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5618948197913515, "res": {"Yes": 0.5618948197913515, "No": 0.4380893473610112}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5254391446674631, "res": {"Yes": 0.5254391446674631, "No": 0.47453538048129174}, "ground_truth": 1}, {"key": "33528627", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5890263261380175, "res": {"Yes": 0.5890263261380175, "No": 0.41095025741407637}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5151440029630916, "res": {"Yes": 0.5151440029630916, "No": 0.4848282376235966}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5890221735170562, "res": {"Yes": 0.5890221735170562, "No": 0.41096225733679087}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5596272566481562, "res": {"Yes": 0.5596272566481562, "No": 0.44035201845042593}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.45244790479260216, "res": {"No": 0.5475298764072158, "Yes": 0.45244790479260216}, "ground_truth": 1}, {"key": "39925662", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.576334302707771, "res": {"Yes": 0.576334302707771, "No": 0.42363989028007926}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4650516054919384, "res": {"No": 0.5349302416643493, "Yes": 0.4650516054919384}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.27799131688664497, "res": {"No": 0.7219835675314838, "Yes": 0.27799131688664497}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6740302282769003, "res": {"Yes": 0.6740302282769003, "No": 0.32594843010197794}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6238559291766236, "res": {"Yes": 0.6238559291766236, "No": 0.3761082304766043}, "ground_truth": 1}, {"key": "29213416", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7152906610096023, "res": {"Yes": 0.7152906610096023, "No": 0.28467713515177284}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6713833658925269, "res": {"Yes": 0.6713833658925269, "No": 0.3285845145572205}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.523275596789579, "res": {"Yes": 0.523275596789579, "No": 0.4767014380970751}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7640862144832528, "res": {"Yes": 0.7640862144832528, "No": 0.23589969157711257}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7567888003846841, "res": {"Yes": 0.7567888003846841, "No": 0.24319434053192973}, "ground_truth": 1}, {"key": "34492745", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.737840250905983, "res": {"Yes": 0.737840250905983, "No": 0.26213936215929995}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5548057092217777, "res": {"Yes": 0.5548057092217777, "No": 0.4451820185484903}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3554753752750485, "res": {"No": 0.6445120242927317, "Yes": 0.3554753752750485}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.646244974236368, "res": {"Yes": 0.646244974236368, "No": 0.35373702823407266}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6546480342908787, "res": {"Yes": 0.6546480342908787, "No": 0.34533010269668757}, "ground_truth": 1}, {"key": "34191937", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6528088620370386, "res": {"Yes": 0.6528088620370386, "No": 0.34717003661222684}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6317721007160335, "res": {"Yes": 0.6317721007160335, "No": 0.36820939296924704}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2626451755793647, "res": {"No": 0.7373390366346386, "Yes": 0.2626451755793647}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.560659651154355, "res": {"Yes": 0.560659651154355, "No": 0.43931286640699185}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6457235357740407, "res": {"Yes": 0.6457235357740407, "No": 0.354251346298278}, "ground_truth": 1}, {"key": "34933372", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6282664745383384, "res": {"Yes": 0.6282664745383384, "No": 0.3717133820649455}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6519378263247552, "res": {"Yes": 0.6519378263247552, "No": 0.34803521910630936}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3860199796907453, "res": {"No": 0.6139729544083589, "Yes": 0.3860199796907453}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.1651797671954004, "res": {"No": 0.8348074829963233, "Yes": 0.1651797671954004}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3757400842194943, "res": {"No": 0.6242398559089642, "Yes": 0.3757400842194943}, "ground_truth": 1}, {"key": "38714379", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.2271859349684765, "res": {"No": 0.7727934900250026, "Yes": 0.2271859349684765}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.2767288591536334, "res": {"No": 0.7232564912889319, "Yes": 0.2767288591536334}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.545272973993181, "res": {"Yes": 0.545272973993181, "No": 0.4547080110439077}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.29342338880656005, "res": {"No": 0.7065561526312504, "Yes": 0.29342338880656005}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.27596252540547045, "res": {"No": 0.724017149298912, "Yes": 0.27596252540547045}, "ground_truth": 1}, {"key": "39220660", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3646567422774291, "res": {"No": 0.6353197268221047, "Yes": 0.3646567422774291}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.2328968563584063, "res": {"No": 0.7670859530063682, "Yes": 0.2328968563584063}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.39480932979596334, "res": {"No": 0.6051679234755974, "Yes": 0.39480932979596334}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5828763195451911, "res": {"Yes": 0.5828763195451911, "No": 0.4170884372219936}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.46311031126572627, "res": {"No": 0.5368680669718078, "Yes": 0.46311031126572627}, "ground_truth": 1}, {"key": "41028780", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6376090421924254, "res": {"Yes": 0.6376090421924254, "No": 0.36236648129452786}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6671903709974502, "res": {"Yes": 0.6671903709974502, "No": 0.33278092113457636}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.37041391848972616, "res": {"No": 0.6295679238800989, "Yes": 0.37041391848972616}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6214043386443565, "res": {"Yes": 0.6214043386443565, "No": 0.37856504933968155}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5861642433040509, "res": {"Yes": 0.5861642433040509, "No": 0.4138143233848244}, "ground_truth": 1}, {"key": "39457108", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7119935333393214, "res": {"Yes": 0.7119935333393214, "No": 0.28797937960593384}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5628764242784129, "res": {"Yes": 0.5628764242784129, "No": 0.43709535676069705}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.46077464268960777, "res": {"No": 0.5391976703289071, "Yes": 0.46077464268960777}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4796154701449817, "res": {"No": 0.5203476464093368, "Yes": 0.4796154701449817}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5217405214668018, "res": {"Yes": 0.5217405214668018, "No": 0.478214740243849}, "ground_truth": 1}, {"key": "38288018", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4886764817347521, "res": {"No": 0.5112765047178633, "Yes": 0.4886764817347521}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.453798868513007, "res": {"No": 0.546165754302226, "Yes": 0.453798868513007}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.22029960900614382, "res": {"No": 0.7796873211414225, "Yes": 0.22029960900614382}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6572580088846388, "res": {"Yes": 0.6572580088846388, "No": 0.3427192431800576}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7694884773648867, "res": {"Yes": 0.7694884773648867, "No": 0.23049170596294744}, "ground_truth": 1}, {"key": "40106293", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6346001521980666, "res": {"Yes": 0.6346001521980666, "No": 0.36538064711548646}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5524135657002917, "res": {"Yes": 0.5524135657002917, "No": 0.4475672380179201}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.47216914478310645, "res": {"No": 0.5278067690324417, "Yes": 0.47216914478310645}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6020941563538733, "res": {"Yes": 0.6020941563538733, "No": 0.3978779655245714}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7164028504148244, "res": {"Yes": 0.7164028504148244, "No": 0.28357461449055055}, "ground_truth": 1}, {"key": "39948797", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6459684793279284, "res": {"Yes": 0.6459684793279284, "No": 0.3539966249264096}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6797126116987038, "res": {"Yes": 0.6797126116987038, "No": 0.32026125320795285}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.12749845909322757, "res": {"No": 0.8724629412671387, "Yes": 0.12749845909322757}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3825204588333193, "res": {"No": 0.6174612163394073, "Yes": 0.3825204588333193}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5885253956657791, "res": {"Yes": 0.5885253956657791, "No": 0.41144979959526806}, "ground_truth": 1}, {"key": "31853399", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5838036666036813, "res": {"Yes": 0.5838036666036813, "No": 0.4161630410095028}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5754983257694603, "res": {"Yes": 0.5754983257694603, "No": 0.42447536835110145}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4419498079617976, "res": {"No": 0.5580240819029038, "Yes": 0.4419498079617976}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.578553069597615, "res": {"Yes": 0.578553069597615, "No": 0.42142245178380056}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4839889515026111, "res": {"No": 0.5159833920335739, "Yes": 0.4839889515026111}, "ground_truth": 1}, {"key": "35273252", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.570532981375756, "res": {"Yes": 0.570532981375756, "No": 0.4294337923345855}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.29073481963616804, "res": {"No": 0.7092416559307682, "Yes": 0.29073481963616804}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.45841230984708975, "res": {"No": 0.5415353516499114, "Yes": 0.45841230984708975}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.44039549655146865, "res": {"No": 0.5595661654752703, "Yes": 0.44039549655146865}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4895491565952024, "res": {"No": 0.5104058578696898, "Yes": 0.4895491565952024}, "ground_truth": 1}, {"key": "37130459", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5333152533317292, "res": {"Yes": 0.5333152533317292, "No": 0.4666569843889959}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5759823852022243, "res": {"Yes": 0.5759823852022243, "No": 0.42397596995104897}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5600872297347159, "res": {"Yes": 0.5600872297347159, "No": 0.4398875732765454}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6829664514619187, "res": {"Yes": 0.6829664514619187, "No": 0.3170139816265678}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7213731720027234, "res": {"Yes": 0.7213731720027234, "No": 0.27860206656117437}, "ground_truth": 1}, {"key": "21734003", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.575492432696777, "res": {"Yes": 0.575492432696777, "No": 0.42448559833074945}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5719554129663936, "res": {"Yes": 0.5719554129663936, "No": 0.42803096409535607}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.61907594747694, "res": {"Yes": 0.61907594747694, "No": 0.38089853944082797}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5528736083012887, "res": {"Yes": 0.5528736083012887, "No": 0.44710089229722894}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7083838650089915, "res": {"Yes": 0.7083838650089915, "No": 0.29159314131263253}, "ground_truth": 1}, {"key": "33990737", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6823859787379546, "res": {"Yes": 0.6823859787379546, "No": 0.31759083724804316}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3585705306780054, "res": {"No": 0.6414072104817142, "Yes": 0.3585705306780054}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.21553251481664548, "res": {"No": 0.7844492655222975, "Yes": 0.21553251481664548}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3806917448360205, "res": {"No": 0.6192829329700847, "Yes": 0.3806917448360205}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.34754417491467343, "res": {"No": 0.6524362602483265, "Yes": 0.34754417491467343}, "ground_truth": 1}, {"key": "34559912", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.45205153055292124, "res": {"No": 0.5479211167127735, "Yes": 0.45205153055292124}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.33608552927431323, "res": {"No": 0.6638906677939282, "Yes": 0.33608552927431323}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5414556597564809, "res": {"Yes": 0.5414556597564809, "No": 0.4585223557604543}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5018144746547573, "res": {"Yes": 0.5018144746547573, "No": 0.49816293836454706}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6992024993933225, "res": {"Yes": 0.6992024993933225, "No": 0.30076110513632265}, "ground_truth": 1}, {"key": "39820439", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5934981393403046, "res": {"Yes": 0.5934981393403046, "No": 0.40647974867213627}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5287846070911779, "res": {"Yes": 0.5287846070911779, "No": 0.4711825879007307}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6520922886911563, "res": {"Yes": 0.6520922886911563, "No": 0.3478840654400828}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5525709154893494, "res": {"Yes": 0.5525709154893494, "No": 0.44740107372822907}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5519316846808714, "res": {"Yes": 0.5519316846808714, "No": 0.448045069528966}, "ground_truth": 1}, {"key": "34759328", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5792976543492773, "res": {"Yes": 0.5792976543492773, "No": 0.42067500627631405}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.35625803260154915, "res": {"No": 0.6437221243000031, "Yes": 0.35625803260154915}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4811454999115701, "res": {"No": 0.5188401393135731, "Yes": 0.4811454999115701}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4108838532180818, "res": {"No": 0.589097425906367, "Yes": 0.4108838532180818}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5900884724613062, "res": {"Yes": 0.5900884724613062, "No": 0.4098891998805936}, "ground_truth": 1}, {"key": "36939137", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.705493797052048, "res": {"Yes": 0.705493797052048, "No": 0.2944836780520699}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5040459723955875, "res": {"Yes": 0.5040459723955875, "No": 0.49593153304553894}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2853906315960698, "res": {"No": 0.7145998809425246, "Yes": 0.2853906315960698}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5953049998402048, "res": {"Yes": 0.5953049998402048, "No": 0.4046655158087682}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.476372022564617, "res": {"No": 0.5236006204382986, "Yes": 0.476372022564617}, "ground_truth": 1}, {"key": "35851522", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8002507763486413, "res": {"Yes": 0.8002507763486413, "No": 0.19973192231164558}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8028881459045027, "res": {"Yes": 0.8028881459045027, "No": 0.19709837685338794}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3871963578511955, "res": {"No": 0.6127834917309297, "Yes": 0.3871963578511955}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5382053716338046, "res": {"Yes": 0.5382053716338046, "No": 0.4617796267855279}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6829856430888459, "res": {"Yes": 0.6829856430888459, "No": 0.3169980996239358}, "ground_truth": 1}, {"key": "22412782", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7970481324363108, "res": {"Yes": 0.7970481324363108, "No": 0.20292971325874473}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6900862425489187, "res": {"Yes": 0.6900862425489187, "No": 0.30989743223763383}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.22554546990255334, "res": {"No": 0.7744380418008662, "Yes": 0.22554546990255334}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5714295931068692, "res": {"Yes": 0.5714295931068692, "No": 0.42853888425880415}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4434023862965084, "res": {"No": 0.5565586627920455, "Yes": 0.4434023862965084}, "ground_truth": 1}, {"key": "38579227", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4373703762246535, "res": {"No": 0.5625960184524705, "Yes": 0.4373703762246535}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.47064692242449163, "res": {"No": 0.5293109566859627, "Yes": 0.47064692242449163}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2904918959445359, "res": {"No": 0.7094874791255393, "Yes": 0.2904918959445359}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5739052649068918, "res": {"Yes": 0.5739052649068918, "No": 0.4260625127218571}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.42485877474393385, "res": {"No": 0.5751080746116074, "Yes": 0.42485877474393385}, "ground_truth": 1}, {"key": "37206995", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.571174392510925, "res": {"Yes": 0.571174392510925, "No": 0.4287848504315382}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.44643293121189054, "res": {"No": 0.5535332258495234, "Yes": 0.44643293121189054}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6593165571183962, "res": {"Yes": 0.6593165571183962, "No": 0.3406530392119395}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.26736577881759976, "res": {"No": 0.7326000576097784, "Yes": 0.26736577881759976}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.35523355657032, "res": {"No": 0.6447126663297134, "Yes": 0.35523355657032}, "ground_truth": 1}, {"key": "38700847", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.33799898042423976, "res": {"No": 0.6619744162102463, "Yes": 0.33799898042423976}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4823637217819582, "res": {"No": 0.5175816802839307, "Yes": 0.4823637217819582}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.568411415154948, "res": {"Yes": 0.568411415154948, "No": 0.43148617861127075}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6125855456183582, "res": {"Yes": 0.6125855456183582, "No": 0.3873681911207433}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4567792026619541, "res": {"No": 0.5431323772965999, "Yes": 0.4567792026619541}, "ground_truth": 1}, {"key": "20246590", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4649931289293387, "res": {"No": 0.5349537684137272, "Yes": 0.4649931289293387}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4449029324212597, "res": {"No": 0.5550366674170224, "Yes": 0.4449029324212597}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.31661406733656666, "res": {"No": 0.6833641492986509, "Yes": 0.31661406733656666}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6035901324812412, "res": {"Yes": 0.6035901324812412, "No": 0.39637594976464}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4436208601176825, "res": {"No": 0.5563625883280517, "Yes": 0.4436208601176825}, "ground_truth": 1}, {"key": "39141360", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.395122276984249, "res": {"No": 0.6048602738130658, "Yes": 0.395122276984249}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6173121421525608, "res": {"Yes": 0.6173121421525608, "No": 0.38266667844160146}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6224269045173001, "res": {"Yes": 0.6224269045173001, "No": 0.37755557597620676}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4555968597464128, "res": {"No": 0.5443843477477236, "Yes": 0.4555968597464128}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.47477778759349104, "res": {"No": 0.5251924038528294, "Yes": 0.47477778759349104}, "ground_truth": 1}, {"key": "37906226", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4786935292565386, "res": {"No": 0.5212826343308216, "Yes": 0.4786935292565386}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6043479021093874, "res": {"Yes": 0.6043479021093874, "No": 0.39562353068459083}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.49314799366381096, "res": {"No": 0.5068437035194775, "Yes": 0.49314799366381096}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6626145701486797, "res": {"Yes": 0.6626145701486797, "No": 0.33736444290656287}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6598822625175507, "res": {"Yes": 0.6598822625175507, "No": 0.3401041788238251}, "ground_truth": 1}, {"key": "16201033", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7553229899165415, "res": {"Yes": 0.7553229899165415, "No": 0.24466244352052344}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6297057891656522, "res": {"Yes": 0.6297057891656522, "No": 0.3702760205419202}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.40613303525971894, "res": {"No": 0.5938475751739977, "Yes": 0.40613303525971894}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5185035524177292, "res": {"Yes": 0.5185035524177292, "No": 0.48146935241411953}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6200179932457491, "res": {"Yes": 0.6200179932457491, "No": 0.3799612139589999}, "ground_truth": 1}, {"key": "36469022", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5435961114828266, "res": {"Yes": 0.5435961114828266, "No": 0.4563851038008603}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4957935345032802, "res": {"No": 0.5041854813809561, "Yes": 0.4957935345032802}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.09417151798179825, "res": {"No": 0.9057859945018871, "Yes": 0.09417151798179825}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4313600003011969, "res": {"No": 0.568596463185514, "Yes": 0.4313600003011969}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5260651576799039, "res": {"Yes": 0.5260651576799039, "No": 0.47390065398652415}, "ground_truth": 1}, {"key": "31295270", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5644190200380395, "res": {"Yes": 0.5644190200380395, "No": 0.43555482536202156}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.452728124652966, "res": {"No": 0.5472308698858196, "Yes": 0.452728124652966}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.283490972317103, "res": {"No": 0.7164961536333411, "Yes": 0.283490972317103}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7792584006210883, "res": {"Yes": 0.7792584006210883, "No": 0.2207199887594163}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7216045751271584, "res": {"Yes": 0.7216045751271584, "No": 0.27837426325498194}, "ground_truth": 1}, {"key": "35360689", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7243013818069926, "res": {"Yes": 0.7243013818069926, "No": 0.27566991200649016}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5138819033218928, "res": {"Yes": 0.5138819033218928, "No": 0.4861013440346846}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5525898137378173, "res": {"Yes": 0.5525898137378173, "No": 0.4473856520790113}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6875505258475053, "res": {"Yes": 0.6875505258475053, "No": 0.31241673290969957}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.71329355871477, "res": {"Yes": 0.71329355871477, "No": 0.28667308188055296}, "ground_truth": 1}, {"key": "29202793", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.685567374236846, "res": {"Yes": 0.685567374236846, "No": 0.3144058851285557}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7764104796751312, "res": {"Yes": 0.7764104796751312, "No": 0.2235439589339714}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.44361939617125956, "res": {"No": 0.5563607634617549, "Yes": 0.44361939617125956}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5593050209451017, "res": {"Yes": 0.5593050209451017, "No": 0.4406704772329585}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.750850931697191, "res": {"Yes": 0.750850931697191, "No": 0.24912689346909714}, "ground_truth": 1}, {"key": "35999008", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.644877082573859, "res": {"Yes": 0.644877082573859, "No": 0.35510395549268214}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5418024106529759, "res": {"Yes": 0.5418024106529759, "No": 0.45818109916457056}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5127069728661017, "res": {"Yes": 0.5127069728661017, "No": 0.4872774040002554}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7068719831429326, "res": {"Yes": 0.7068719831429326, "No": 0.2931036143161411}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7170582861392254, "res": {"Yes": 0.7170582861392254, "No": 0.2829152206202849}, "ground_truth": 1}, {"key": "31797119", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6965967406512197, "res": {"Yes": 0.6965967406512197, "No": 0.3033811024298932}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6047025468221491, "res": {"Yes": 0.6047025468221491, "No": 0.3952656731165228}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5284840784753997, "res": {"Yes": 0.5284840784753997, "No": 0.4714945197442655}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.640581590578143, "res": {"Yes": 0.640581590578143, "No": 0.35938921982666305}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4741205332766493, "res": {"No": 0.5258436256934007, "Yes": 0.4741205332766493}, "ground_truth": 1}, {"key": "26711893", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4151290804020833, "res": {"No": 0.5848410371754168, "Yes": 0.4151290804020833}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5398838473827181, "res": {"Yes": 0.5398838473827181, "No": 0.46008681916151495}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6662804306656949, "res": {"Yes": 0.6662804306656949, "No": 0.33369589325438914}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7474972893585932, "res": {"Yes": 0.7474972893585932, "No": 0.25248410064294186}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7252136122053159, "res": {"Yes": 0.7252136122053159, "No": 0.2747622501937268}, "ground_truth": 1}, {"key": "35348288", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7741737324888557, "res": {"Yes": 0.7741737324888557, "No": 0.22580718671115882}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7463596204410239, "res": {"Yes": 0.7463596204410239, "No": 0.2536228900608471}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5005528957485125, "res": {"Yes": 0.5005528957485125, "No": 0.49941805919806886}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4994711201912281, "res": {"No": 0.5004829233448718, "Yes": 0.4994711201912281}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6102810318239315, "res": {"Yes": 0.6102810318239315, "No": 0.389670565760271}, "ground_truth": 1}, {"key": "38124131", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6520683051778378, "res": {"Yes": 0.6520683051778378, "No": 0.347903756235431}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5586194370882939, "res": {"Yes": 0.5586194370882939, "No": 0.4413416707077378}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4312858860800508, "res": {"No": 0.5686972274062367, "Yes": 0.4312858860800508}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4900950632802216, "res": {"No": 0.5098807317126993, "Yes": 0.4900950632802216}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6032236593483412, "res": {"Yes": 0.6032236593483412, "No": 0.3967523208259146}, "ground_truth": 1}, {"key": "20285901", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6359292588828158, "res": {"Yes": 0.6359292588828158, "No": 0.3640505672418248}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.24946192017199986, "res": {"No": 0.7505210802714686, "Yes": 0.24946192017199986}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5285021000897424, "res": {"Yes": 0.5285021000897424, "No": 0.4714737272944216}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5268866705295848, "res": {"Yes": 0.5268866705295848, "No": 0.4730870591628263}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6694195803735309, "res": {"Yes": 0.6694195803735309, "No": 0.33055027938182097}, "ground_truth": 1}, {"key": "35633632", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4754333381451324, "res": {"No": 0.5245501189703887, "Yes": 0.4754333381451324}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.48788856969092687, "res": {"No": 0.5120894818370504, "Yes": 0.48788856969092687}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6602047663727275, "res": {"Yes": 0.6602047663727275, "No": 0.3397710399932669}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6638954279070812, "res": {"Yes": 0.6638954279070812, "No": 0.33607702641798415}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6891431118710741, "res": {"Yes": 0.6891431118710741, "No": 0.31083330726445024}, "ground_truth": 1}, {"key": "10741274", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7454611192954346, "res": {"Yes": 0.7454611192954346, "No": 0.2545191500617969}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6448609801941462, "res": {"Yes": 0.6448609801941462, "No": 0.35511272666870636}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5962657035116172, "res": {"Yes": 0.5962657035116172, "No": 0.4037137305239467}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7163329687253013, "res": {"Yes": 0.7163329687253013, "No": 0.2836399859729645}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.603720008869196, "res": {"Yes": 0.603720008869196, "No": 0.3962556084792343}, "ground_truth": 1}, {"key": "30605795", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7403629796541292, "res": {"Yes": 0.7403629796541292, "No": 0.2596163797586397}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6829289849501073, "res": {"Yes": 0.6829289849501073, "No": 0.31704616017873677}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.554378950445029, "res": {"Yes": 0.554378950445029, "No": 0.4456038590771648}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5208954443488447, "res": {"Yes": 0.5208954443488447, "No": 0.4790793872105202}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.555289877381174, "res": {"Yes": 0.555289877381174, "No": 0.4446875403322534}, "ground_truth": 1}, {"key": "30539722", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5807311301894044, "res": {"Yes": 0.5807311301894044, "No": 0.4192474125138794}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6210750008659423, "res": {"Yes": 0.6210750008659423, "No": 0.378900276959929}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.24139361995924719, "res": {"No": 0.7585800640471213, "Yes": 0.24139361995924719}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6894847910035267, "res": {"Yes": 0.6894847910035267, "No": 0.3104824502934518}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5950114083040897, "res": {"Yes": 0.5950114083040897, "No": 0.4049568948536733}, "ground_truth": 1}, {"key": "18639299", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7370250265812027, "res": {"Yes": 0.7370250265812027, "No": 0.26294226384786024}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.48107100510990014, "res": {"No": 0.5188953779751062, "Yes": 0.48107100510990014}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5220887637800259, "res": {"Yes": 0.5220887637800259, "No": 0.4778352840091482}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7775803470583588, "res": {"Yes": 0.7775803470583588, "No": 0.22234325445367836}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5350897816486431, "res": {"Yes": 0.5350897816486431, "No": 0.46485681757740704}, "ground_truth": 1}, {"key": "39773552", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6542287814279905, "res": {"Yes": 0.6542287814279905, "No": 0.3457084808352865}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6780637831663281, "res": {"Yes": 0.6780637831663281, "No": 0.3218599712230742}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.36778994699081385, "res": {"No": 0.6322005115768388, "Yes": 0.36778994699081385}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7806479726503731, "res": {"Yes": 0.7806479726503731, "No": 0.21933426250256935}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7105340774238542, "res": {"Yes": 0.7105340774238542, "No": 0.2894470500729466}, "ground_truth": 1}, {"key": "34086410", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8250333658588486, "res": {"Yes": 0.8250333658588486, "No": 0.17495221491048912}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7634118623136094, "res": {"Yes": 0.7634118623136094, "No": 0.23657111939459607}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5734152500813374, "res": {"Yes": 0.5734152500813374, "No": 0.42655865292214634}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5405890503334627, "res": {"Yes": 0.5405890503334627, "No": 0.4593926444801335}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6446941633417088, "res": {"Yes": 0.6446941633417088, "No": 0.3552849981135892}, "ground_truth": 1}, {"key": "35454652", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6551936095008004, "res": {"Yes": 0.6551936095008004, "No": 0.34478039529577326}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6546773893668723, "res": {"Yes": 0.6546773893668723, "No": 0.34529947327501326}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.18879653088298726, "res": {"No": 0.8111945618512294, "Yes": 0.18879653088298726}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7141233446155433, "res": {"Yes": 0.7141233446155433, "No": 0.28585331052581603}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6063353276470579, "res": {"Yes": 0.6063353276470579, "No": 0.3936441462128062}, "ground_truth": 1}, {"key": "36158310", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6072648481119126, "res": {"Yes": 0.6072648481119126, "No": 0.3927090783071956}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.734049334067696, "res": {"Yes": 0.734049334067696, "No": 0.26592451198669714}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.03632528222912074, "res": {"No": 0.9636474047370435, "Yes": 0.03632528222912074}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3238788023471631, "res": {"No": 0.6760960008029177, "Yes": 0.3238788023471631}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6681131590610666, "res": {"Yes": 0.6681131590610666, "No": 0.3318584687176967}, "ground_truth": 1}, {"key": "35688387", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4608086168564555, "res": {"No": 0.5391582240703076, "Yes": 0.4608086168564555}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.419145296282453, "res": {"No": 0.5808200469318393, "Yes": 0.419145296282453}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.34989614398625973, "res": {"No": 0.6500912248610158, "Yes": 0.34989614398625973}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.852530596624407, "res": {"Yes": 0.852530596624407, "No": 0.14743921350119446}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8113800464667713, "res": {"Yes": 0.8113800464667713, "No": 0.18859457005460004}, "ground_truth": 1}, {"key": "34209292", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7745395772836517, "res": {"Yes": 0.7745395772836517, "No": 0.2254374144055409}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7953217732412904, "res": {"Yes": 0.7953217732412904, "No": 0.20465134579177333}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3693676239584399, "res": {"No": 0.630614637575846, "Yes": 0.3693676239584399}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7506656745792486, "res": {"Yes": 0.7506656745792486, "No": 0.24931066738945828}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7645894697870906, "res": {"Yes": 0.7645894697870906, "No": 0.23539371117431915}, "ground_truth": 1}, {"key": "25037859", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7128555027828168, "res": {"Yes": 0.7128555027828168, "No": 0.28712888137419573}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6877422141483646, "res": {"Yes": 0.6877422141483646, "No": 0.31223271118879187}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5203056508455489, "res": {"Yes": 0.5203056508455489, "No": 0.4796764811129995}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6131532342362706, "res": {"Yes": 0.6131532342362706, "No": 0.38682893968043297}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6862528521696267, "res": {"Yes": 0.6862528521696267, "No": 0.3137229523191418}, "ground_truth": 1}, {"key": "36412121", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6604005857329025, "res": {"Yes": 0.6604005857329025, "No": 0.3395705323340168}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6916889628909588, "res": {"Yes": 0.6916889628909588, "No": 0.3082798514313782}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7117265146474523, "res": {"Yes": 0.7117265146474523, "No": 0.28824882389425255}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7682530560827164, "res": {"Yes": 0.7682530560827164, "No": 0.23172487376094467}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6027710133890778, "res": {"Yes": 0.6027710133890778, "No": 0.39720317237404523}, "ground_truth": 1}, {"key": "34909172", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7321147170633794, "res": {"Yes": 0.7321147170633794, "No": 0.2678581043676916}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7528248132321447, "res": {"Yes": 0.7528248132321447, "No": 0.2471497378306281}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.43178562600648746, "res": {"No": 0.5681845506031954, "Yes": 0.43178562600648746}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3755795197093831, "res": {"No": 0.6243790581880256, "Yes": 0.3755795197093831}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.44872233055993616, "res": {"No": 0.5512172303859211, "Yes": 0.44872233055993616}, "ground_truth": 1}, {"key": "39011806", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.42910453002602844, "res": {"No": 0.5708430361632939, "Yes": 0.42910453002602844}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.44363940385719686, "res": {"No": 0.5563084012509021, "Yes": 0.44363940385719686}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7378813940254331, "res": {"Yes": 0.7378813940254331, "No": 0.2621039757340459}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8507733241423757, "res": {"Yes": 0.8507733241423757, "No": 0.14920768268669524}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8588470145559332, "res": {"Yes": 0.8588470145559332, "No": 0.1411422827334699}, "ground_truth": 1}, {"key": "33096163", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.849174786907059, "res": {"Yes": 0.849174786907059, "No": 0.15080819219248073}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7081753970666931, "res": {"Yes": 0.7081753970666931, "No": 0.29181107194635875}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5601157389002616, "res": {"Yes": 0.5601157389002616, "No": 0.4398680251071525}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6497409071116097, "res": {"Yes": 0.6497409071116097, "No": 0.3502415919171221}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7030080192872835, "res": {"Yes": 0.7030080192872835, "No": 0.29696176079518233}, "ground_truth": 1}, {"key": "38762205", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6854091772532717, "res": {"Yes": 0.6854091772532717, "No": 0.31456844354018065}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6182527960917859, "res": {"Yes": 0.6182527960917859, "No": 0.3817272502421301}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4360485014335266, "res": {"No": 0.5639400936827763, "Yes": 0.4360485014335266}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7575671489870021, "res": {"Yes": 0.7575671489870021, "No": 0.24242182299065368}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6502037653921412, "res": {"Yes": 0.6502037653921412, "No": 0.34977251253593894}, "ground_truth": 1}, {"key": "35519177", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7133603974525675, "res": {"Yes": 0.7133603974525675, "No": 0.286619565012121}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6108065207142889, "res": {"Yes": 0.6108065207142889, "No": 0.38917755496569945}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.42675384815336276, "res": {"No": 0.5732171865293694, "Yes": 0.42675384815336276}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5601853544101102, "res": {"Yes": 0.5601853544101102, "No": 0.4397867845874341}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6079710398354448, "res": {"Yes": 0.6079710398354448, "No": 0.39200513491676797}, "ground_truth": 1}, {"key": "36192531", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6887098942324356, "res": {"Yes": 0.6887098942324356, "No": 0.31126719118674273}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7401464847566916, "res": {"Yes": 0.7401464847566916, "No": 0.2598272478876994}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6634170180663341, "res": {"Yes": 0.6634170180663341, "No": 0.3365350751883697}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6957307270012932, "res": {"Yes": 0.6957307270012932, "No": 0.3042235457347408}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7250794673473052, "res": {"Yes": 0.7250794673473052, "No": 0.27486970323925397}, "ground_truth": 1}, {"key": "33160852", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7403041009277009, "res": {"Yes": 0.7403041009277009, "No": 0.2596546759989324}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6302213513227641, "res": {"Yes": 0.6302213513227641, "No": 0.3697298556041711}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5032416030731741, "res": {"Yes": 0.5032416030731741, "No": 0.49673966649054874}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6171806871841258, "res": {"Yes": 0.6171806871841258, "No": 0.38280054334798336}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5293287153664596, "res": {"Yes": 0.5293287153664596, "No": 0.47065285261307427}, "ground_truth": 1}, {"key": "36312304", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5931871091437991, "res": {"Yes": 0.5931871091437991, "No": 0.4067877818672734}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6212919367665521, "res": {"Yes": 0.6212919367665521, "No": 0.37867712118010016}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5875597711565429, "res": {"Yes": 0.5875597711565429, "No": 0.41242255346922396}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7545412275905026, "res": {"Yes": 0.7545412275905026, "No": 0.24544072670062445}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7117790206490978, "res": {"Yes": 0.7117790206490978, "No": 0.28819368716823757}, "ground_truth": 1}, {"key": "33773343", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6260695448768812, "res": {"Yes": 0.6260695448768812, "No": 0.37391381099901877}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5768545061441585, "res": {"Yes": 0.5768545061441585, "No": 0.42312631393870237}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4816478180237591, "res": {"No": 0.5183258605946668, "Yes": 0.4816478180237591}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6645691586643996, "res": {"Yes": 0.6645691586643996, "No": 0.3354083614897256}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5681690109682419, "res": {"Yes": 0.5681690109682419, "No": 0.4318034634391274}, "ground_truth": 1}, {"key": "34913320", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6208160355413289, "res": {"Yes": 0.6208160355413289, "No": 0.37916297618915945}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4254080427803155, "res": {"No": 0.5745745069638063, "Yes": 0.4254080427803155}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4931725974309507, "res": {"No": 0.5068129136997389, "Yes": 0.4931725974309507}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6862859646685765, "res": {"Yes": 0.6862859646685765, "No": 0.31369559687041454}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5879137062098819, "res": {"Yes": 0.5879137062098819, "No": 0.4120685335080542}, "ground_truth": 1}, {"key": "33784155", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6669829470733608, "res": {"Yes": 0.6669829470733608, "No": 0.33299999633756383}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5508247932378966, "res": {"Yes": 0.5508247932378966, "No": 0.44915954063433117}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.39337933643159406, "res": {"No": 0.6065842551295363, "Yes": 0.39337933643159406}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.39241781979516743, "res": {"No": 0.6075104513786171, "Yes": 0.39241781979516743}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5826861929898327, "res": {"Yes": 0.5826861929898327, "No": 0.41724118211534733}, "ground_truth": 1}, {"key": "24085062", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5743078226578328, "res": {"Yes": 0.5743078226578328, "No": 0.4256317258127429}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5829672903218844, "res": {"Yes": 0.5829672903218844, "No": 0.4169753381747431}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.49097689957654767, "res": {"No": 0.5090067302621868, "Yes": 0.49097689957654767}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7651506778811873, "res": {"Yes": 0.7651506778811873, "No": 0.23482942017642397}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6804423483663117, "res": {"Yes": 0.6804423483663117, "No": 0.3195349249087746}, "ground_truth": 1}, {"key": "33893487", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7052151115107868, "res": {"Yes": 0.7052151115107868, "No": 0.2947651032486212}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.47749418363722007, "res": {"No": 0.5224798815996374, "Yes": 0.47749418363722007}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.40004021477106133, "res": {"No": 0.5999453147518095, "Yes": 0.40004021477106133}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.2490116242181617, "res": {"No": 0.7509731876893596, "Yes": 0.2490116242181617}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4272859832226331, "res": {"No": 0.5726875493981389, "Yes": 0.4272859832226331}, "ground_truth": 1}, {"key": "40913011", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3844048057550187, "res": {"No": 0.6155778738975608, "Yes": 0.3844048057550187}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4194869760170889, "res": {"No": 0.5804891551098561, "Yes": 0.4194869760170889}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7364239552041598, "res": {"Yes": 0.7364239552041598, "No": 0.2635574785168103}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6475030726592581, "res": {"Yes": 0.6475030726592581, "No": 0.35247739022239966}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6333282872673884, "res": {"Yes": 0.6333282872673884, "No": 0.36664998696278}, "ground_truth": 1}, {"key": "29642545", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5958228426370964, "res": {"Yes": 0.5958228426370964, "No": 0.4041524745381185}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7095573883708799, "res": {"Yes": 0.7095573883708799, "No": 0.29042299943826655}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6267916689433363, "res": {"Yes": 0.6267916689433363, "No": 0.37318733754215927}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6966178130213424, "res": {"Yes": 0.6966178130213424, "No": 0.3033636888543881}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7215128433685751, "res": {"Yes": 0.7215128433685751, "No": 0.2784636635833677}, "ground_truth": 1}, {"key": "35969159", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7762153767110446, "res": {"Yes": 0.7762153767110446, "No": 0.2237611926637662}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5534330232649272, "res": {"Yes": 0.5534330232649272, "No": 0.44654371835935114}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3539363798278505, "res": {"No": 0.6460297781852101, "Yes": 0.3539363798278505}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7157898791249729, "res": {"Yes": 0.7157898791249729, "No": 0.28418552416397735}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7786429906560096, "res": {"Yes": 0.7786429906560096, "No": 0.22132694091478342}, "ground_truth": 1}, {"key": "37081669", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7398933831413497, "res": {"Yes": 0.7398933831413497, "No": 0.26008046892114833}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6464718331065598, "res": {"Yes": 0.6464718331065598, "No": 0.3535030025164388}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5322248971317403, "res": {"Yes": 0.5322248971317403, "No": 0.467753074918125}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6595368715816112, "res": {"Yes": 0.6595368715816112, "No": 0.34043815494731217}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7018822458365443, "res": {"Yes": 0.7018822458365443, "No": 0.29809376330590837}, "ground_truth": 1}, {"key": "40048022", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7566862094812975, "res": {"Yes": 0.7566862094812975, "No": 0.24328567715417712}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6201482230996489, "res": {"Yes": 0.6201482230996489, "No": 0.3798265035980886}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5915656575197052, "res": {"Yes": 0.5915656575197052, "No": 0.4084180241889854}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7501593262596774, "res": {"Yes": 0.7501593262596774, "No": 0.24982440197819575}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.698076809507232, "res": {"Yes": 0.698076809507232, "No": 0.30190900951554644}, "ground_truth": 1}, {"key": "32884004", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6555029011041495, "res": {"Yes": 0.6555029011041495, "No": 0.34448225475508776}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6994122426515409, "res": {"Yes": 0.6994122426515409, "No": 0.3005685593843236}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.8246307488430085, "res": {"Yes": 0.8246307488430085, "No": 0.17534945683597106}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8178323700246101, "res": {"Yes": 0.8178323700246101, "No": 0.1821461121458381}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5226408563200226, "res": {"Yes": 0.5226408563200226, "No": 0.4773371138901936}, "ground_truth": 1}, {"key": "39022490", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.58767088921515, "res": {"Yes": 0.58767088921515, "No": 0.41230312494456767}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5429511642593728, "res": {"Yes": 0.5429511642593728, "No": 0.45701804641249194}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5944786773624916, "res": {"Yes": 0.5944786773624916, "No": 0.40549821800443003}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6359256023000899, "res": {"Yes": 0.6359256023000899, "No": 0.3640561008525022}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6880722307529337, "res": {"Yes": 0.6880722307529337, "No": 0.3119104349039483}, "ground_truth": 1}, {"key": "35159385", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6090252626187533, "res": {"Yes": 0.6090252626187533, "No": 0.3909525624556182}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5121659937209322, "res": {"Yes": 0.5121659937209322, "No": 0.4878163138659071}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5481112235202806, "res": {"Yes": 0.5481112235202806, "No": 0.4518712612329453}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7831305549851709, "res": {"Yes": 0.7831305549851709, "No": 0.21684787676715483}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7218553690726397, "res": {"Yes": 0.7218553690726397, "No": 0.27812333850335436}, "ground_truth": 1}, {"key": "34363669", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.827042760279063, "res": {"Yes": 0.827042760279063, "No": 0.17293651796595225}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7256429424101434, "res": {"Yes": 0.7256429424101434, "No": 0.27433875612657077}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.34969193423202777, "res": {"No": 0.6502932525918075, "Yes": 0.34969193423202777}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5343606999375289, "res": {"Yes": 0.5343606999375289, "No": 0.4656201062363379}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5964523042424079, "res": {"Yes": 0.5964523042424079, "No": 0.4035274757637251}, "ground_truth": 1}, {"key": "36119687", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5651562937406457, "res": {"Yes": 0.5651562937406457, "No": 0.43482470766199816}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5412081086901396, "res": {"Yes": 0.5412081086901396, "No": 0.45877100187835285}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.45006019432359, "res": {"No": 0.5499170116771863, "Yes": 0.45006019432359}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8446842585275427, "res": {"Yes": 0.8446842585275427, "No": 0.15529595430560786}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8267267414688204, "res": {"Yes": 0.8267267414688204, "No": 0.17325366270174186}, "ground_truth": 1}, {"key": "35217446", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8689275664087909, "res": {"Yes": 0.8689275664087909, "No": 0.13105338758311014}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8486122761179204, "res": {"Yes": 0.8486122761179204, "No": 0.15136367410858007}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5423664494515577, "res": {"Yes": 0.5423664494515577, "No": 0.4576068635556856}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6355366874270375, "res": {"Yes": 0.6355366874270375, "No": 0.36444118448166335}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5810004195578127, "res": {"Yes": 0.5810004195578127, "No": 0.4189724722104505}, "ground_truth": 1}, {"key": "39049331", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4026180231050033, "res": {"No": 0.5973586453411981, "Yes": 0.4026180231050033}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3271575237730735, "res": {"No": 0.6727987353547712, "Yes": 0.3271575237730735}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6874155248062557, "res": {"Yes": 0.6874155248062557, "No": 0.31255979003330275}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6205335043909189, "res": {"Yes": 0.6205335043909189, "No": 0.3794352181044491}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5281207121022449, "res": {"Yes": 0.5281207121022449, "No": 0.47185471404795387}, "ground_truth": 1}, {"key": "36472242", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5270451291744762, "res": {"Yes": 0.5270451291744762, "No": 0.47293518002374096}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6841647005959314, "res": {"Yes": 0.6841647005959314, "No": 0.31581420410674377}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5207556756024084, "res": {"Yes": 0.5207556756024084, "No": 0.47922225081765907}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7059980101339641, "res": {"Yes": 0.7059980101339641, "No": 0.2939794829391102}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6462104204413995, "res": {"Yes": 0.6462104204413995, "No": 0.3537673447964384}, "ground_truth": 1}, {"key": "31854721", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7444180848326098, "res": {"Yes": 0.7444180848326098, "No": 0.2555581505823494}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.83140369322302, "res": {"Yes": 0.83140369322302, "No": 0.16857903309748287}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.26498631389734356, "res": {"No": 0.7349907756383198, "Yes": 0.26498631389734356}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5671762369528598, "res": {"Yes": 0.5671762369528598, "No": 0.43279134038613515}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7214265339498238, "res": {"Yes": 0.7214265339498238, "No": 0.2785498614256748}, "ground_truth": 1}, {"key": "18725849", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7095526556388831, "res": {"Yes": 0.7095526556388831, "No": 0.29042270901541234}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6624894538271077, "res": {"Yes": 0.6624894538271077, "No": 0.3374911807912033}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5456305394249692, "res": {"Yes": 0.5456305394249692, "No": 0.4543479340029061}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6761290965121679, "res": {"Yes": 0.6761290965121679, "No": 0.3238532493177381}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8392282831111163, "res": {"Yes": 0.8392282831111163, "No": 0.1607479610381349}, "ground_truth": 1}, {"key": "36883179", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7383914315036318, "res": {"Yes": 0.7383914315036318, "No": 0.2615871974520876}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6752116781578938, "res": {"Yes": 0.6752116781578938, "No": 0.32476202358193207}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5043124058818875, "res": {"Yes": 0.5043124058818875, "No": 0.4956639510106614}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.623825030357667, "res": {"Yes": 0.623825030357667, "No": 0.3761470205185875}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.43115520900632337, "res": {"No": 0.5688166891173109, "Yes": 0.43115520900632337}, "ground_truth": 1}, {"key": "34266359", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4830537248219047, "res": {"No": 0.5169240605906232, "Yes": 0.4830537248219047}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5005731184939974, "res": {"Yes": 0.5005731184939974, "No": 0.4994029969765429}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6071806020311713, "res": {"Yes": 0.6071806020311713, "No": 0.3927879264962729}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.772028455639502, "res": {"Yes": 0.772028455639502, "No": 0.22793754796107246}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8134101232400254, "res": {"Yes": 0.8134101232400254, "No": 0.18655712248717266}, "ground_truth": 1}, {"key": "31920289", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6568504775738829, "res": {"Yes": 0.6568504775738829, "No": 0.34310965123603393}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5268448373887423, "res": {"Yes": 0.5268448373887423, "No": 0.4731171721124765}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.47073451796726723, "res": {"No": 0.5292428705038917, "Yes": 0.47073451796726723}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.49533441433637887, "res": {"No": 0.5046350420410499, "Yes": 0.49533441433637887}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.690679833848594, "res": {"Yes": 0.690679833848594, "No": 0.309289669333268}, "ground_truth": 1}, {"key": "36292997", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6980376066144377, "res": {"Yes": 0.6980376066144377, "No": 0.30193123083638135}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6236435112114644, "res": {"Yes": 0.6236435112114644, "No": 0.3763252812035307}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5553892442885291, "res": {"Yes": 0.5553892442885291, "No": 0.44459325433635194}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5822082659425101, "res": {"Yes": 0.5822082659425101, "No": 0.41776339390910966}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7105539371288563, "res": {"Yes": 0.7105539371288563, "No": 0.28942198504374167}, "ground_truth": 1}, {"key": "30412533", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.795692264718543, "res": {"Yes": 0.795692264718543, "No": 0.2042785653880038}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7109810515186926, "res": {"Yes": 0.7109810515186926, "No": 0.28898791741392765}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3651246050350926, "res": {"No": 0.6348525130373277, "Yes": 0.3651246050350926}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4831430980277634, "res": {"No": 0.5168343458675441, "Yes": 0.4831430980277634}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4956782263380142, "res": {"No": 0.5042980583980341, "Yes": 0.4956782263380142}, "ground_truth": 1}, {"key": "40433191", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.38047081740853306, "res": {"No": 0.619506986706464, "Yes": 0.38047081740853306}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.45180337719423436, "res": {"No": 0.5481783602943094, "Yes": 0.45180337719423436}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6635905906605657, "res": {"Yes": 0.6635905906605657, "No": 0.3363805064819785}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.628857920094265, "res": {"Yes": 0.628857920094265, "No": 0.3711093558887084}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7487290050092738, "res": {"Yes": 0.7487290050092738, "No": 0.2512347042673338}, "ground_truth": 1}, {"key": "34565591", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.804425170941491, "res": {"Yes": 0.804425170941491, "No": 0.1955502889802126}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4052745947067627, "res": {"No": 0.5946950356254452, "Yes": 0.4052745947067627}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.29064987933225317, "res": {"No": 0.709340119691656, "Yes": 0.29064987933225317}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8280064705114967, "res": {"Yes": 0.8280064705114967, "No": 0.17197325645234937}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7474939704779964, "res": {"Yes": 0.7474939704779964, "No": 0.2524810456038071}, "ground_truth": 1}, {"key": "36062480", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6228948839701667, "res": {"Yes": 0.6228948839701667, "No": 0.3770885268006306}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.39069311472374857, "res": {"No": 0.6092843178724968, "Yes": 0.39069311472374857}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.45546910096757925, "res": {"No": 0.5445099843752064, "Yes": 0.45546910096757925}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4683608421127926, "res": {"No": 0.531613902661035, "Yes": 0.4683608421127926}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5591782408679182, "res": {"Yes": 0.5591782408679182, "No": 0.44079836513905674}, "ground_truth": 1}, {"key": "37276883", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6093619212649002, "res": {"Yes": 0.6093619212649002, "No": 0.39060502335905306}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5476034419877683, "res": {"Yes": 0.5476034419877683, "No": 0.45236631317071846}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.36294125128689797, "res": {"No": 0.6370449249962666, "Yes": 0.36294125128689797}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6937000892035002, "res": {"Yes": 0.6937000892035002, "No": 0.3062820100417497}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7965560354529286, "res": {"Yes": 0.7965560354529286, "No": 0.20342739888299546}, "ground_truth": 1}, {"key": "38509260", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7545940322332223, "res": {"Yes": 0.7545940322332223, "No": 0.24538813438836}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5936683790178702, "res": {"Yes": 0.5936683790178702, "No": 0.4063048252427619}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5246102043820414, "res": {"Yes": 0.5246102043820414, "No": 0.4753472449635672}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3855435971098737, "res": {"No": 0.6144094293605025, "Yes": 0.3855435971098737}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.32142144634864533, "res": {"No": 0.6785297526786626, "Yes": 0.32142144634864533}, "ground_truth": 1}, {"key": "37139607", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.35047976709787904, "res": {"No": 0.6494750355648118, "Yes": 0.35047976709787904}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.29801325905302817, "res": {"No": 0.7019349381145192, "Yes": 0.29801325905302817}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.04347237065681313, "res": {"No": 0.9564679703181902, "Yes": 0.04347237065681313}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.2088039929150769, "res": {"No": 0.7911610966030534, "Yes": 0.2088039929150769}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.11688246754280605, "res": {"No": 0.8830736085158309, "Yes": 0.11688246754280605}, "ground_truth": 1}, {"key": "37092824", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.1335958074144999, "res": {"No": 0.8663702598535401, "Yes": 0.1335958074144999}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.15880141811718534, "res": {"No": 0.8411649522613363, "Yes": 0.15880141811718534}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3657123074115559, "res": {"No": 0.6342693579242719, "Yes": 0.3657123074115559}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.22809846025989525, "res": {"No": 0.771885659023444, "Yes": 0.22809846025989525}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4108733182911436, "res": {"No": 0.5890980444589891, "Yes": 0.4108733182911436}, "ground_truth": 1}, {"key": "32191802", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.26381641907972164, "res": {"No": 0.7361667377904303, "Yes": 0.26381641907972164}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.3047006986749984, "res": {"No": 0.6952806235641864, "Yes": 0.3047006986749984}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5509984626180464, "res": {"Yes": 0.5509984626180464, "No": 0.44898333847585353}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6190475449240292, "res": {"Yes": 0.6190475449240292, "No": 0.3809341170258591}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6634336965798163, "res": {"Yes": 0.6634336965798163, "No": 0.33654803203818223}, "ground_truth": 1}, {"key": "39396038", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7081235676061041, "res": {"Yes": 0.7081235676061041, "No": 0.2918548468901894}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7310949405736503, "res": {"Yes": 0.7310949405736503, "No": 0.26888607556423444}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4701961645360173, "res": {"No": 0.5297883191747491, "Yes": 0.4701961645360173}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7701421583045954, "res": {"Yes": 0.7701421583045954, "No": 0.22983767042506983}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.817952223961597, "res": {"Yes": 0.817952223961597, "No": 0.1820269365199165}, "ground_truth": 1}, {"key": "39076884", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6683891868866506, "res": {"Yes": 0.6683891868866506, "No": 0.33158864479150923}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6203777576192419, "res": {"Yes": 0.6203777576192419, "No": 0.3796027377785926}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7839006567418654, "res": {"Yes": 0.7839006567418654, "No": 0.21608254316804548}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7831844440526915, "res": {"Yes": 0.7831844440526915, "No": 0.21680572563713388}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6348292969054355, "res": {"Yes": 0.6348292969054355, "No": 0.36515516724354463}, "ground_truth": 1}, {"key": "27763432", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7195250481410608, "res": {"Yes": 0.7195250481410608, "No": 0.2804569617045489}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8026354926792025, "res": {"Yes": 0.8026354926792025, "No": 0.19735342935573766}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5146864493232481, "res": {"Yes": 0.5146864493232481, "No": 0.48525578272620284}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4489019002849212, "res": {"No": 0.5510477571454235, "Yes": 0.4489019002849212}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4577717873254303, "res": {"No": 0.5421791321632915, "Yes": 0.4577717873254303}, "ground_truth": 1}, {"key": "37806929", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.42493570663812325, "res": {"No": 0.5750026957125713, "Yes": 0.42493570663812325}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4630220740029868, "res": {"No": 0.536936790482591, "Yes": 0.4630220740029868}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5526576206678331, "res": {"Yes": 0.5526576206678331, "No": 0.4473253485576597}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6354439439705291, "res": {"Yes": 0.6354439439705291, "No": 0.3645374461092734}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7477492234411508, "res": {"Yes": 0.7477492234411508, "No": 0.25223365971080836}, "ground_truth": 1}, {"key": "32334186", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5868647878884841, "res": {"Yes": 0.5868647878884841, "No": 0.4131181291175491}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6045086921240381, "res": {"Yes": 0.6045086921240381, "No": 0.3954714822249819}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3504494869541228, "res": {"No": 0.6495378428374335, "Yes": 0.3504494869541228}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6041146386303581, "res": {"Yes": 0.6041146386303581, "No": 0.3958617281660507}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6314771004516934, "res": {"Yes": 0.6314771004516934, "No": 0.3685031570830107}, "ground_truth": 1}, {"key": "36187324", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6110552306703483, "res": {"Yes": 0.6110552306703483, "No": 0.38892187150336444}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6832710541087388, "res": {"Yes": 0.6832710541087388, "No": 0.3167074189229653}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4363398093274287, "res": {"No": 0.5636434321019048, "Yes": 0.4363398093274287}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5041012692717375, "res": {"Yes": 0.5041012692717375, "No": 0.49587995884800695}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.43289836560394146, "res": {"No": 0.5670871405647391, "Yes": 0.43289836560394146}, "ground_truth": 1}, {"key": "35306009", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.48160121603552764, "res": {"No": 0.5183725949610115, "Yes": 0.48160121603552764}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.45673843693731403, "res": {"No": 0.5432382658428514, "Yes": 0.45673843693731403}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7351913819924836, "res": {"Yes": 0.7351913819924836, "No": 0.2647857686850614}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6052928127616155, "res": {"Yes": 0.6052928127616155, "No": 0.39468072186768494}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5929666031712199, "res": {"Yes": 0.5929666031712199, "No": 0.40700823920398865}, "ground_truth": 1}, {"key": "39490050", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6176698423245421, "res": {"Yes": 0.6176698423245421, "No": 0.38229003673418654}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.500859403008283, "res": {"Yes": 0.500859403008283, "No": 0.4991199357031692}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.8011086084754422, "res": {"Yes": 0.8011086084754422, "No": 0.19887119999727723}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5552786606389404, "res": {"Yes": 0.5552786606389404, "No": 0.44469723462630006}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6867402509708369, "res": {"Yes": 0.6867402509708369, "No": 0.313227442178025}, "ground_truth": 1}, {"key": "38072149", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4731607198210325, "res": {"No": 0.526807922664309, "Yes": 0.4731607198210325}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7260558418257155, "res": {"Yes": 0.7260558418257155, "No": 0.27391851700901226}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4355232487818476, "res": {"No": 0.5644523894768949, "Yes": 0.4355232487818476}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4182316388579721, "res": {"No": 0.5817390729758689, "Yes": 0.4182316388579721}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5290823966448638, "res": {"Yes": 0.5290823966448638, "No": 0.47087729927408034}, "ground_truth": 1}, {"key": "35899689", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4883807460620739, "res": {"No": 0.5115902332795703, "Yes": 0.4883807460620739}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6225124816505704, "res": {"Yes": 0.6225124816505704, "No": 0.3774627238261652}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.31113788653370655, "res": {"No": 0.6888493583306886, "Yes": 0.31113788653370655}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6804034962174594, "res": {"Yes": 0.6804034962174594, "No": 0.31956544195126896}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5374187463440816, "res": {"Yes": 0.5374187463440816, "No": 0.4625590150785632}, "ground_truth": 1}, {"key": "27994518", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5194573863539189, "res": {"Yes": 0.5194573863539189, "No": 0.48052217586145546}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5474539666524173, "res": {"Yes": 0.5474539666524173, "No": 0.4525241260617206}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5483618224305693, "res": {"Yes": 0.5483618224305693, "No": 0.4516133434898412}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6889051367213903, "res": {"Yes": 0.6889051367213903, "No": 0.31105983183034724}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6935321092574096, "res": {"Yes": 0.6935321092574096, "No": 0.30643218628826296}, "ground_truth": 1}, {"key": "10615479", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7321145193924326, "res": {"Yes": 0.7321145193924326, "No": 0.26785087229650706}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6655444842699823, "res": {"Yes": 0.6655444842699823, "No": 0.33442772216385674}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7152431672865203, "res": {"Yes": 0.7152431672865203, "No": 0.2847407676021407}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6496795614713335, "res": {"Yes": 0.6496795614713335, "No": 0.35029872097951215}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6774978158981809, "res": {"Yes": 0.6774978158981809, "No": 0.32248069661341455}, "ground_truth": 1}, {"key": "40186667", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6879652369598472, "res": {"Yes": 0.6879652369598472, "No": 0.31200829655617535}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4899695660051275, "res": {"No": 0.5100166534364136, "Yes": 0.4899695660051275}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3975821895887267, "res": {"No": 0.6024043990399254, "Yes": 0.3975821895887267}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.631485524412401, "res": {"Yes": 0.631485524412401, "No": 0.36849121777413907}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7680711399355161, "res": {"Yes": 0.7680711399355161, "No": 0.23189991529173445}, "ground_truth": 1}, {"key": "38622886", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7067923231593568, "res": {"Yes": 0.7067923231593568, "No": 0.29318463935228223}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7286830829200813, "res": {"Yes": 0.7286830829200813, "No": 0.2712972488467195}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.27822982449745237, "res": {"No": 0.7217585458875084, "Yes": 0.27822982449745237}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.288483525110724, "res": {"No": 0.7115007552236625, "Yes": 0.288483525110724}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5301989317155239, "res": {"Yes": 0.5301989317155239, "No": 0.469781286715299}, "ground_truth": 1}, {"key": "40686943", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4803680971075054, "res": {"No": 0.519609853884321, "Yes": 0.4803680971075054}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5097402228479456, "res": {"Yes": 0.5097402228479456, "No": 0.4902423099525739}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.26742195826917403, "res": {"No": 0.732549912852059, "Yes": 0.26742195826917403}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3255706793646384, "res": {"No": 0.6744032589072789, "Yes": 0.3255706793646384}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.25374047151778795, "res": {"No": 0.7462371752631629, "Yes": 0.25374047151778795}, "ground_truth": 1}, {"key": "30604567", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.18680666013413214, "res": {"No": 0.813177122751567, "Yes": 0.18680666013413214}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5204960394926305, "res": {"Yes": 0.5204960394926305, "No": 0.4794842173535669}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6928834124142358, "res": {"Yes": 0.6928834124142358, "No": 0.3070953172322118}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7468123202961462, "res": {"Yes": 0.7468123202961462, "No": 0.25316564023346455}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8484188145744196, "res": {"Yes": 0.8484188145744196, "No": 0.15156343936460237}, "ground_truth": 1}, {"key": "35440903", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8535816981539907, "res": {"Yes": 0.8535816981539907, "No": 0.14640153390743688}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7308779180142514, "res": {"Yes": 0.7308779180142514, "No": 0.26910121667093084}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5443942882966704, "res": {"Yes": 0.5443942882966704, "No": 0.45559387104081583}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6016373643383278, "res": {"Yes": 0.6016373643383278, "No": 0.3983397080260544}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6871551879892186, "res": {"Yes": 0.6871551879892186, "No": 0.3128176644120276}, "ground_truth": 1}, {"key": "37219533", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6920698424925219, "res": {"Yes": 0.6920698424925219, "No": 0.3079093984989524}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6592943121530338, "res": {"Yes": 0.6592943121530338, "No": 0.3406831202033581}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6868077265151766, "res": {"Yes": 0.6868077265151766, "No": 0.3131745738479979}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5605456750273147, "res": {"Yes": 0.5605456750273147, "No": 0.43943136946020134}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6498468105144847, "res": {"Yes": 0.6498468105144847, "No": 0.3501283771126146}, "ground_truth": 1}, {"key": "40178965", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6734522728553689, "res": {"Yes": 0.6734522728553689, "No": 0.32652913498157693}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7187088361170306, "res": {"Yes": 0.7187088361170306, "No": 0.28125779789471106}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.46266917737277685, "res": {"No": 0.5373089091780696, "Yes": 0.46266917737277685}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.47413954589123414, "res": {"No": 0.5258276139987776, "Yes": 0.47413954589123414}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4756791055951249, "res": {"No": 0.5242840140240459, "Yes": 0.4756791055951249}, "ground_truth": 1}, {"key": "13750468", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6580516205829179, "res": {"Yes": 0.6580516205829179, "No": 0.34191596106352673}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.45833601805141816, "res": {"No": 0.5416363194969449, "Yes": 0.45833601805141816}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.37106634680678535, "res": {"No": 0.6289170292279649, "Yes": 0.37106634680678535}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8180425881349512, "res": {"Yes": 0.8180425881349512, "No": 0.18193561831682412}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7050597485814531, "res": {"Yes": 0.7050597485814531, "No": 0.294920603365851}, "ground_truth": 1}, {"key": "17754949", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6863247958269806, "res": {"Yes": 0.6863247958269806, "No": 0.3136571401476835}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7534246996626808, "res": {"Yes": 0.7534246996626808, "No": 0.24655581034268795}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6262332772084217, "res": {"Yes": 0.6262332772084217, "No": 0.3737512910383486}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4789043923154606, "res": {"No": 0.5210787484469503, "Yes": 0.4789043923154606}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4084989479839841, "res": {"No": 0.5914876943039329, "Yes": 0.4084989479839841}, "ground_truth": 1}, {"key": "36675623", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.2967172837784463, "res": {"No": 0.7032684898193217, "Yes": 0.2967172837784463}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.32539254328320744, "res": {"No": 0.6745950122652433, "Yes": 0.32539254328320744}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4971149459743795, "res": {"No": 0.5028721329730628, "Yes": 0.4971149459743795}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.12830281074514596, "res": {"No": 0.8716814251117548, "Yes": 0.12830281074514596}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.528187629235579, "res": {"Yes": 0.528187629235579, "No": 0.47179660871782797}, "ground_truth": 1}, {"key": "40035440", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.48006757679494894, "res": {"No": 0.519915073987247, "Yes": 0.48006757679494894}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.36109146033828854, "res": {"No": 0.6388957841516555, "Yes": 0.36109146033828854}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6348532304210728, "res": {"Yes": 0.6348532304210728, "No": 0.36511598819609287}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5245269868202098, "res": {"Yes": 0.5245269868202098, "No": 0.47542687229570146}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6603532367083883, "res": {"Yes": 0.6603532367083883, "No": 0.33961287941968477}, "ground_truth": 1}, {"key": "37685909", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7423665909032845, "res": {"Yes": 0.7423665909032845, "No": 0.2576067968017649}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.673085226940078, "res": {"Yes": 0.673085226940078, "No": 0.3268775967585787}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.45659772380282293, "res": {"No": 0.5433682565805088, "Yes": 0.45659772380282293}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6400134866242874, "res": {"Yes": 0.6400134866242874, "No": 0.35994407745547846}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6972819713708498, "res": {"Yes": 0.6972819713708498, "No": 0.30267798329704093}, "ground_truth": 1}, {"key": "36938787", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6627474376895204, "res": {"Yes": 0.6627474376895204, "No": 0.3372178224534957}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.617742404262762, "res": {"Yes": 0.617742404262762, "No": 0.3822270405271628}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6490547209752452, "res": {"Yes": 0.6490547209752452, "No": 0.3509270190744646}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7617247721081178, "res": {"Yes": 0.7617247721081178, "No": 0.238251581138941}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.836364036767283, "res": {"Yes": 0.836364036767283, "No": 0.16362124562688063}, "ground_truth": 1}, {"key": "39398068", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.717425133748613, "res": {"Yes": 0.717425133748613, "No": 0.28255185152973716}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7718524840907536, "res": {"Yes": 0.7718524840907536, "No": 0.22812914156607178}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.39251609352060113, "res": {"No": 0.6074667425740836, "Yes": 0.39251609352060113}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.825362380498505, "res": {"Yes": 0.825362380498505, "No": 0.17461519707301393}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.856105100002959, "res": {"Yes": 0.856105100002959, "No": 0.14387707353282228}, "ground_truth": 1}, {"key": "39926408", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8322100883501367, "res": {"Yes": 0.8322100883501367, "No": 0.1677698297470615}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7391343313946135, "res": {"Yes": 0.7391343313946135, "No": 0.26084693490366606}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6233723039811733, "res": {"Yes": 0.6233723039811733, "No": 0.37657942417717966}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5819593960043684, "res": {"Yes": 0.5819593960043684, "No": 0.41800318369130934}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5714667200935905, "res": {"Yes": 0.5714667200935905, "No": 0.42849153332828066}, "ground_truth": 1}, {"key": "40465336", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5285257035205931, "res": {"Yes": 0.5285257035205931, "No": 0.47143902810503857}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.35226491042519265, "res": {"No": 0.6477129235531283, "Yes": 0.35226491042519265}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.36927770127699, "res": {"No": 0.6306764156115818, "Yes": 0.36927770127699}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6084239097362208, "res": {"Yes": 0.6084239097362208, "No": 0.39154587221754933}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6546657362130549, "res": {"Yes": 0.6546657362130549, "No": 0.34531114459445417}, "ground_truth": 1}, {"key": "34173549", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.635249807380708, "res": {"Yes": 0.635249807380708, "No": 0.36472716429338975}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6305654389410861, "res": {"Yes": 0.6305654389410861, "No": 0.36940360211712137}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7188059546161447, "res": {"Yes": 0.7188059546161447, "No": 0.2811745579066602}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6406785435323061, "res": {"Yes": 0.6406785435323061, "No": 0.3593003897913666}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6617918489869391, "res": {"Yes": 0.6617918489869391, "No": 0.33817853936039793}, "ground_truth": 1}, {"key": "33541535", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6377107298142308, "res": {"Yes": 0.6377107298142308, "No": 0.3622688004591391}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6556868938109134, "res": {"Yes": 0.6556868938109134, "No": 0.3442958025395324}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6255558715766812, "res": {"Yes": 0.6255558715766812, "No": 0.37440738862429}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6569959203695411, "res": {"Yes": 0.6569959203695411, "No": 0.3429703083981482}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5599969733498268, "res": {"Yes": 0.5599969733498268, "No": 0.4399668921563893}, "ground_truth": 1}, {"key": "35685195", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5888658972181884, "res": {"Yes": 0.5888658972181884, "No": 0.41109464960050845}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5103560804138089, "res": {"Yes": 0.5103560804138089, "No": 0.48960785705810056}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3864338951977191, "res": {"No": 0.6135502138587677, "Yes": 0.3864338951977191}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.596910949519144, "res": {"Yes": 0.596910949519144, "No": 0.40306441141217136}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6680644153031755, "res": {"Yes": 0.6680644153031755, "No": 0.33190898142055464}, "ground_truth": 1}, {"key": "28440730", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4731280539325755, "res": {"No": 0.5268569707650628, "Yes": 0.4731280539325755}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.686008390693103, "res": {"Yes": 0.686008390693103, "No": 0.31396432945144853}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.47350836509345806, "res": {"No": 0.5264433766054193, "Yes": 0.47350836509345806}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5088132630401899, "res": {"Yes": 0.5088132630401899, "No": 0.4911246076421197}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.43886362647947863, "res": {"No": 0.5610849830469218, "Yes": 0.43886362647947863}, "ground_truth": 1}, {"key": "38338714", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4258364017172963, "res": {"No": 0.574098709314737, "Yes": 0.4258364017172963}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5307296611998582, "res": {"Yes": 0.5307296611998582, "No": 0.4692274781901454}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.2528853892020137, "res": {"No": 0.7470620587431355, "Yes": 0.2528853892020137}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5523671428149471, "res": {"Yes": 0.5523671428149471, "No": 0.447597064892482}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7049488302568276, "res": {"Yes": 0.7049488302568276, "No": 0.29499233677901915}, "ground_truth": 1}, {"key": "32191881", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5659460632109958, "res": {"Yes": 0.5659460632109958, "No": 0.43399791458368214}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6781845570807079, "res": {"Yes": 0.6781845570807079, "No": 0.3217656478892686}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.36464718839593785, "res": {"No": 0.6353189326729425, "Yes": 0.36464718839593785}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5492568479364806, "res": {"Yes": 0.5492568479364806, "No": 0.45071841114902894}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6694298962087477, "res": {"Yes": 0.6694298962087477, "No": 0.33054783331880394}, "ground_truth": 1}, {"key": "37707251", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.46396089886234215, "res": {"No": 0.5360148034048942, "Yes": 0.46396089886234215}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7058352398792912, "res": {"Yes": 0.7058352398792912, "No": 0.2941410690567051}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.46988714506203305, "res": {"No": 0.5300918688523005, "Yes": 0.46988714506203305}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6250630527088861, "res": {"Yes": 0.6250630527088861, "No": 0.37491105417954423}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.46233904195331665, "res": {"No": 0.5376428966934068, "Yes": 0.46233904195331665}, "ground_truth": 1}, {"key": "40172567", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5132092100933475, "res": {"Yes": 0.5132092100933475, "No": 0.4867640355070978}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6570476739764778, "res": {"Yes": 0.6570476739764778, "No": 0.3429299774613861}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5674282155785576, "res": {"Yes": 0.5674282155785576, "No": 0.4325502648745624}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.630760685917024, "res": {"Yes": 0.630760685917024, "No": 0.36921151048911666}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6348163719125274, "res": {"Yes": 0.6348163719125274, "No": 0.3651518808618282}, "ground_truth": 1}, {"key": "33113255", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7410148895709558, "res": {"Yes": 0.7410148895709558, "No": 0.25895685866959306}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6379378845605916, "res": {"Yes": 0.6379378845605916, "No": 0.36203785528978}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.49520986825166396, "res": {"No": 0.5047767129799369, "Yes": 0.49520986825166396}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6041522761447412, "res": {"Yes": 0.6041522761447412, "No": 0.39582749948231466}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8181558048825753, "res": {"Yes": 0.8181558048825753, "No": 0.18182758064990764}, "ground_truth": 1}, {"key": "33022143", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7249134214123747, "res": {"Yes": 0.7249134214123747, "No": 0.2750710640421956}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8368562312271197, "res": {"Yes": 0.8368562312271197, "No": 0.16312684347057377}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4619814916807275, "res": {"No": 0.5380033457357529, "Yes": 0.4619814916807275}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5412683809810223, "res": {"Yes": 0.5412683809810223, "No": 0.4587135948672093}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6846748807726797, "res": {"Yes": 0.6846748807726797, "No": 0.31530372448153027}, "ground_truth": 1}, {"key": "32084473", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6326057618169979, "res": {"Yes": 0.6326057618169979, "No": 0.3673741382285533}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6473131231246992, "res": {"Yes": 0.6473131231246992, "No": 0.3526637942901835}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.40027175702272055, "res": {"No": 0.5996986259735356, "Yes": 0.40027175702272055}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.40321462119420814, "res": {"No": 0.5967554386629714, "Yes": 0.40321462119420814}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.37272078698926947, "res": {"No": 0.6272367236011649, "Yes": 0.37272078698926947}, "ground_truth": 1}, {"key": "40564245", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5672885830036128, "res": {"Yes": 0.5672885830036128, "No": 0.4326591558056272}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5814430198759891, "res": {"Yes": 0.5814430198759891, "No": 0.4185182173050042}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6307703050908303, "res": {"Yes": 0.6307703050908303, "No": 0.3692192640122486}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7308549980421295, "res": {"Yes": 0.7308549980421295, "No": 0.2691276706207199}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.785860486813703, "res": {"Yes": 0.785860486813703, "No": 0.21412761712408643}, "ground_truth": 1}, {"key": "31717213", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7923254974252327, "res": {"Yes": 0.7923254974252327, "No": 0.20765621067707782}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7962913121904243, "res": {"Yes": 0.7962913121904243, "No": 0.20369595776625574}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5917993543560375, "res": {"Yes": 0.5917993543560375, "No": 0.4081782143784991}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5318207087873164, "res": {"Yes": 0.5318207087873164, "No": 0.4681624817931389}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.33385580526070957, "res": {"No": 0.6661307875624048, "Yes": 0.33385580526070957}, "ground_truth": 1}, {"key": "34861894", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6607703484384493, "res": {"Yes": 0.6607703484384493, "No": 0.33921413647640797}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5139847208199627, "res": {"Yes": 0.5139847208199627, "No": 0.48599927833021445}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7343968565366764, "res": {"Yes": 0.7343968565366764, "No": 0.2655855149374916}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7482474052600592, "res": {"Yes": 0.7482474052600592, "No": 0.251735310157387}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7303872982363308, "res": {"Yes": 0.7303872982363308, "No": 0.269597977992481}, "ground_truth": 1}, {"key": "40838760", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7091690971287586, "res": {"Yes": 0.7091690971287586, "No": 0.2908098970586762}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6616058454422119, "res": {"Yes": 0.6616058454422119, "No": 0.3383744014312854}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.31733689791390524, "res": {"No": 0.6826458739744112, "Yes": 0.31733689791390524}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7722385299975972, "res": {"Yes": 0.7722385299975972, "No": 0.2277257556727953}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5439649850035823, "res": {"Yes": 0.5439649850035823, "No": 0.4560141222959733}, "ground_truth": 1}, {"key": "40044849", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7525404196357347, "res": {"Yes": 0.7525404196357347, "No": 0.24743315852836278}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6639549886374755, "res": {"Yes": 0.6639549886374755, "No": 0.3360232247929896}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5654034340932136, "res": {"Yes": 0.5654034340932136, "No": 0.4345769716601804}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5630063905605666, "res": {"Yes": 0.5630063905605666, "No": 0.4369561902745541}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.732706350936468, "res": {"Yes": 0.732706350936468, "No": 0.26726027036816263}, "ground_truth": 1}, {"key": "30296116", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7996580341600997, "res": {"Yes": 0.7996580341600997, "No": 0.20031547103042097}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5214633682799142, "res": {"Yes": 0.5214633682799142, "No": 0.4784970419647909}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.29256324893809416, "res": {"No": 0.7074162931735225, "Yes": 0.29256324893809416}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4683546176385627, "res": {"No": 0.5316159759592984, "Yes": 0.4683546176385627}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.40932670994098663, "res": {"No": 0.5906447748896325, "Yes": 0.40932670994098663}, "ground_truth": 1}, {"key": "34931360", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6160741988647163, "res": {"Yes": 0.6160741988647163, "No": 0.38389598710482375}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.45779382041177624, "res": {"No": 0.5421897210251426, "Yes": 0.45779382041177624}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.49871225142915737, "res": {"No": 0.501273790070669, "Yes": 0.49871225142915737}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7009556364790857, "res": {"Yes": 0.7009556364790857, "No": 0.2990284678269704}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7702414514319416, "res": {"Yes": 0.7702414514319416, "No": 0.2297415264584844}, "ground_truth": 1}, {"key": "18862422", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8419989683315523, "res": {"Yes": 0.8419989683315523, "No": 0.1579889002508226}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7475176963131464, "res": {"Yes": 0.7475176963131464, "No": 0.25246834612660773}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.569501250677419, "res": {"Yes": 0.569501250677419, "No": 0.43047694954385085}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6606795714363463, "res": {"Yes": 0.6606795714363463, "No": 0.33929630409035894}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6330493612629218, "res": {"Yes": 0.6330493612629218, "No": 0.3669193536125325}, "ground_truth": 1}, {"key": "36361140", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5833599343672428, "res": {"Yes": 0.5833599343672428, "No": 0.4166056866934956}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5010610445052249, "res": {"Yes": 0.5010610445052249, "No": 0.4989010497441504}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4723185627371897, "res": {"No": 0.5276526350194667, "Yes": 0.4723185627371897}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6103477330827234, "res": {"Yes": 0.6103477330827234, "No": 0.3896187430213134}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5484009165383833, "res": {"Yes": 0.5484009165383833, "No": 0.4515800608129078}, "ground_truth": 1}, {"key": "39703329", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6146621756417924, "res": {"Yes": 0.6146621756417924, "No": 0.38531176236750075}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6419780281135697, "res": {"Yes": 0.6419780281135697, "No": 0.35800085654517905}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5590700168018787, "res": {"Yes": 0.5590700168018787, "No": 0.44090980423399034}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.3314183183064364, "res": {"No": 0.6685621081661884, "Yes": 0.3314183183064364}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4704726976568144, "res": {"No": 0.5295057260125482, "Yes": 0.4704726976568144}, "ground_truth": 1}, {"key": "34033324", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4724116895215045, "res": {"No": 0.5275684811356317, "Yes": 0.4724116895215045}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.37780697573138367, "res": {"No": 0.6221729190348335, "Yes": 0.37780697573138367}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5048111904068241, "res": {"Yes": 0.5048111904068241, "No": 0.4951643556042387}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5838356424061506, "res": {"Yes": 0.5838356424061506, "No": 0.41613662381815003}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4912338459017035, "res": {"No": 0.5087439979175435, "Yes": 0.4912338459017035}, "ground_truth": 1}, {"key": "35658862", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4552422655386576, "res": {"No": 0.5447362208087698, "Yes": 0.4552422655386576}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.39575394969217625, "res": {"No": 0.6042301261809033, "Yes": 0.39575394969217625}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5622163155672983, "res": {"Yes": 0.5622163155672983, "No": 0.4377684943722016}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7070459657456653, "res": {"Yes": 0.7070459657456653, "No": 0.29292364535035514}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6735636373954952, "res": {"Yes": 0.6735636373954952, "No": 0.326413107146372}, "ground_truth": 1}, {"key": "36092657", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6428444801612387, "res": {"Yes": 0.6428444801612387, "No": 0.35712254242819824}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6176776744277982, "res": {"Yes": 0.6176776744277982, "No": 0.3823043728793651}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6119656166454225, "res": {"Yes": 0.6119656166454225, "No": 0.38801531441346215}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5454843845817726, "res": {"Yes": 0.5454843845817726, "No": 0.45448534959433884}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.668838481994211, "res": {"Yes": 0.668838481994211, "No": 0.33113759338345217}, "ground_truth": 1}, {"key": "26333438", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6195739962059545, "res": {"Yes": 0.6195739962059545, "No": 0.38040456418484825}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7355516772662181, "res": {"Yes": 0.7355516772662181, "No": 0.26442688318021457}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6125991696723916, "res": {"Yes": 0.6125991696723916, "No": 0.3873871261406933}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5587048453562775, "res": {"Yes": 0.5587048453562775, "No": 0.441275315562835}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6880305761209823, "res": {"Yes": 0.6880305761209823, "No": 0.3119415339245687}, "ground_truth": 1}, {"key": "34184963", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8090749184249707, "res": {"Yes": 0.8090749184249707, "No": 0.1909044381425974}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6179415038307305, "res": {"Yes": 0.6179415038307305, "No": 0.3820396805442455}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6296875468531813, "res": {"Yes": 0.6296875468531813, "No": 0.37029847846359565}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7551999729267195, "res": {"Yes": 0.7551999729267195, "No": 0.2447813049324986}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6287590651113465, "res": {"Yes": 0.6287590651113465, "No": 0.37122586540073316}, "ground_truth": 1}, {"key": "35069975", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6773145030184886, "res": {"Yes": 0.6773145030184886, "No": 0.32267088729484106}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6552753827658118, "res": {"Yes": 0.6552753827658118, "No": 0.3447089986692834}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3337694479346904, "res": {"No": 0.6662151250585612, "Yes": 0.3337694479346904}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.46468517300308726, "res": {"No": 0.5352881922595041, "Yes": 0.46468517300308726}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6775469972496526, "res": {"Yes": 0.6775469972496526, "No": 0.3224266211349481}, "ground_truth": 1}, {"key": "36443950", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6302159629532456, "res": {"Yes": 0.6302159629532456, "No": 0.36975420681433774}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.08761262240838875, "res": {"No": 0.9123196471674516, "Yes": 0.08761262240838875}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4540209212291495, "res": {"No": 0.5459496082930602, "Yes": 0.4540209212291495}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.45276737788297633, "res": {"No": 0.5472073394643222, "Yes": 0.45276737788297633}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6552522650581065, "res": {"Yes": 0.6552522650581065, "No": 0.344717237312803}, "ground_truth": 1}, {"key": "29460858", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4781413399148409, "res": {"No": 0.5218236674433773, "Yes": 0.4781413399148409}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5065450325328922, "res": {"Yes": 0.5065450325328922, "No": 0.4934189345324899}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5354071197407955, "res": {"Yes": 0.5354071197407955, "No": 0.4645739174590132}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7737599233944861, "res": {"Yes": 0.7737599233944861, "No": 0.22622178757010777}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7535224854653865, "res": {"Yes": 0.7535224854653865, "No": 0.24645851396704857}, "ground_truth": 1}, {"key": "36155704", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7220011985854773, "res": {"Yes": 0.7220011985854773, "No": 0.27798539573465575}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8159425752193988, "res": {"Yes": 0.8159425752193988, "No": 0.1840417030578835}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.34859363667749965, "res": {"No": 0.6513841621441391, "Yes": 0.34859363667749965}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6856692365482908, "res": {"Yes": 0.6856692365482908, "No": 0.3143153178398945}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6342735821722624, "res": {"Yes": 0.6342735821722624, "No": 0.3657098571473047}, "ground_truth": 1}, {"key": "37185211", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6490944897763041, "res": {"Yes": 0.6490944897763041, "No": 0.35089164741370354}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6904240119861558, "res": {"Yes": 0.6904240119861558, "No": 0.30955688725979724}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4765438189952514, "res": {"No": 0.5234359006541592, "Yes": 0.4765438189952514}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5391351324180819, "res": {"Yes": 0.5391351324180819, "No": 0.460844243347749}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7290316954026712, "res": {"Yes": 0.7290316954026712, "No": 0.27094704042118906}, "ground_truth": 1}, {"key": "36454885", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6243869441453302, "res": {"Yes": 0.6243869441453302, "No": 0.37558427457620086}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6878714530520178, "res": {"Yes": 0.6878714530520178, "No": 0.3121020691379152}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.537665585702382, "res": {"Yes": 0.537665585702382, "No": 0.4623003642869762}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6240361123072413, "res": {"Yes": 0.6240361123072413, "No": 0.3759364145997563}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.45658650533456857, "res": {"No": 0.5433652680633161, "Yes": 0.45658650533456857}, "ground_truth": 1}, {"key": "33148906", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5428262998515506, "res": {"Yes": 0.5428262998515506, "No": 0.45712125273892756}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6651037469789453, "res": {"Yes": 0.6651037469789453, "No": 0.3348596132214327}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3336697992558253, "res": {"No": 0.6662957219770458, "Yes": 0.3336697992558253}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5466115910427298, "res": {"Yes": 0.5466115910427298, "No": 0.45335058703879416}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5650774938411032, "res": {"Yes": 0.5650774938411032, "No": 0.4348760504461934}, "ground_truth": 1}, {"key": "18086604", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.39401407380693054, "res": {"No": 0.6059427920056331, "Yes": 0.39401407380693054}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.28330956781042904, "res": {"No": 0.7166539721245516, "Yes": 0.28330956781042904}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6262315801185401, "res": {"Yes": 0.6262315801185401, "No": 0.3737495717863641}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5483589161206122, "res": {"Yes": 0.5483589161206122, "No": 0.4516238662033337}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.40005304026593846, "res": {"No": 0.5999256488667175, "Yes": 0.40005304026593846}, "ground_truth": 1}, {"key": "33693397", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5212435395993175, "res": {"Yes": 0.5212435395993175, "No": 0.47873524921553406}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.34529829925879996, "res": {"No": 0.6546838576114322, "Yes": 0.34529829925879996}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5035522996616952, "res": {"Yes": 0.5035522996616952, "No": 0.49642483335464355}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.547154892154412, "res": {"Yes": 0.547154892154412, "No": 0.4528206989088762}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6451746781590048, "res": {"Yes": 0.6451746781590048, "No": 0.35480529668790944}, "ground_truth": 1}, {"key": "39501530", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.560753423715457, "res": {"Yes": 0.560753423715457, "No": 0.4392263039428174}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5791089209596649, "res": {"Yes": 0.5791089209596649, "No": 0.4208717599066626}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4066634377148165, "res": {"No": 0.5933112524669214, "Yes": 0.4066634377148165}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6824254968542193, "res": {"Yes": 0.6824254968542193, "No": 0.31754564728724477}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6671841861713776, "res": {"Yes": 0.6671841861713776, "No": 0.33279057192122496}, "ground_truth": 1}, {"key": "30948874", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8028425110392446, "res": {"Yes": 0.8028425110392446, "No": 0.19713302979394298}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6550187158095951, "res": {"Yes": 0.6550187158095951, "No": 0.3449527941028733}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.48883940919436397, "res": {"No": 0.5111407430444171, "Yes": 0.48883940919436397}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6778221100672774, "res": {"Yes": 0.6778221100672774, "No": 0.3221585381826449}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6004427375263811, "res": {"Yes": 0.6004427375263811, "No": 0.39953427208840875}, "ground_truth": 1}, {"key": "39410675", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.589822732864136, "res": {"Yes": 0.589822732864136, "No": 0.41015341760280366}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5107946850636245, "res": {"Yes": 0.5107946850636245, "No": 0.4891788304107919}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.10735434289531079, "res": {"No": 0.8926377941865593, "Yes": 0.10735434289531079}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.712286564722562, "res": {"Yes": 0.712286564722562, "No": 0.2876860493120156}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7173629787276194, "res": {"Yes": 0.7173629787276194, "No": 0.2826108827771209}, "ground_truth": 1}, {"key": "32903337", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6215678827134379, "res": {"Yes": 0.6215678827134379, "No": 0.37841129230728077}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6906147748725713, "res": {"Yes": 0.6906147748725713, "No": 0.30936257750021984}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.35717050720640914, "res": {"No": 0.642808231183052, "Yes": 0.35717050720640914}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6039342769286054, "res": {"Yes": 0.6039342769286054, "No": 0.3960448288373654}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.508073782910725, "res": {"Yes": 0.508073782910725, "No": 0.4919097078312492}, "ground_truth": 1}, {"key": "27685132", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.46373377138076466, "res": {"No": 0.5362523266543243, "Yes": 0.46373377138076466}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.45423137690664545, "res": {"No": 0.5457496635736534, "Yes": 0.45423137690664545}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5444731985233021, "res": {"Yes": 0.5444731985233021, "No": 0.45550350840301884}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6288547506583347, "res": {"Yes": 0.6288547506583347, "No": 0.37110675813230937}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5931623144408498, "res": {"Yes": 0.5931623144408498, "No": 0.4068126821094656}, "ground_truth": 1}, {"key": "22791471", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.625598342006445, "res": {"Yes": 0.625598342006445, "No": 0.3743706984980504}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.03511950868219529, "res": {"No": 0.964829024523862, "Yes": 0.03511950868219529}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.45725015624745546, "res": {"No": 0.5427287844385911, "Yes": 0.45725015624745546}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.661635155230372, "res": {"Yes": 0.661635155230372, "No": 0.33834036267867934}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6587953098077913, "res": {"Yes": 0.6587953098077913, "No": 0.3411818702616869}, "ground_truth": 1}, {"key": "32292348", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7433791264529079, "res": {"Yes": 0.7433791264529079, "No": 0.2565959526289543}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.701477187197839, "res": {"Yes": 0.701477187197839, "No": 0.29849789443304603}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.523276067737828, "res": {"Yes": 0.523276067737828, "No": 0.47671278372631426}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7818332472392071, "res": {"Yes": 0.7818332472392071, "No": 0.21814373469381299}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8610308024423123, "res": {"Yes": 0.8610308024423123, "No": 0.13895496377083344}, "ground_truth": 1}, {"key": "20482930", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7805265288861435, "res": {"Yes": 0.7805265288861435, "No": 0.21945539038317163}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7195540168026342, "res": {"Yes": 0.7195540168026342, "No": 0.2804254401136}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4332630021950166, "res": {"No": 0.5667221106889099, "Yes": 0.4332630021950166}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7017365010844816, "res": {"Yes": 0.7017365010844816, "No": 0.29824568077600183}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5840194160766365, "res": {"Yes": 0.5840194160766365, "No": 0.4159580771004407}, "ground_truth": 1}, {"key": "11635754", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7128614979228047, "res": {"Yes": 0.7128614979228047, "No": 0.28711544405698314}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.635322318931878, "res": {"Yes": 0.635322318931878, "No": 0.36465542951551994}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.3289170788347978, "res": {"No": 0.6710676012941035, "Yes": 0.3289170788347978}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.49206469855858986, "res": {"No": 0.5079188948282036, "Yes": 0.49206469855858986}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6399979664854191, "res": {"Yes": 0.6399979664854191, "No": 0.3599793177056434}, "ground_truth": 1}, {"key": "40029096", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7428345777760469, "res": {"Yes": 0.7428345777760469, "No": 0.2571519560860854}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6687716081778086, "res": {"Yes": 0.6687716081778086, "No": 0.3312086962573719}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5687433221844838, "res": {"Yes": 0.5687433221844838, "No": 0.43123857661331955}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5397149765360579, "res": {"Yes": 0.5397149765360579, "No": 0.46026585996769087}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6866013580676804, "res": {"Yes": 0.6866013580676804, "No": 0.31337444297758565}, "ground_truth": 1}, {"key": "40414719", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6435225434520907, "res": {"Yes": 0.6435225434520907, "No": 0.3564560958527479}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6226819214779303, "res": {"Yes": 0.6226819214779303, "No": 0.3772955071428299}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6790743215837438, "res": {"Yes": 0.6790743215837438, "No": 0.32089930392575894}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5894752468279861, "res": {"Yes": 0.5894752468279861, "No": 0.4104977915527437}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.48499412573723155, "res": {"No": 0.5149753724228472, "Yes": 0.48499412573723155}, "ground_truth": 1}, {"key": "39537616", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5338949672025555, "res": {"Yes": 0.5338949672025555, "No": 0.46607577536330014}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6380319809581537, "res": {"Yes": 0.6380319809581537, "No": 0.3619311060672016}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.08821947811896104, "res": {"No": 0.9117577984985609, "Yes": 0.08821947811896104}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5781982361457076, "res": {"Yes": 0.5781982361457076, "No": 0.42171540001862096}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5323770500409941, "res": {"Yes": 0.5323770500409941, "No": 0.4675451300716359}, "ground_truth": 1}, {"key": "33245830", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.40796623718486125, "res": {"No": 0.5919897609146411, "Yes": 0.40796623718486125}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.2910264565394853, "res": {"No": 0.7089246532209632, "Yes": 0.2910264565394853}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.10201239025366249, "res": {"No": 0.8979638837768736, "Yes": 0.10201239025366249}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.4242284804084614, "res": {"No": 0.5757486126061545, "Yes": 0.4242284804084614}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5799035745724574, "res": {"Yes": 0.5799035745724574, "No": 0.4200577194017267}, "ground_truth": 1}, {"key": "39243601", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5037960124708359, "res": {"Yes": 0.5037960124708359, "No": 0.4961585232464576}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.37243350394394814, "res": {"No": 0.6275164143447464, "Yes": 0.37243350394394814}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.06435913480519344, "res": {"No": 0.935625985969858, "Yes": 0.06435913480519344}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5596860933543448, "res": {"Yes": 0.5596860933543448, "No": 0.44029751945384227}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5385799637011498, "res": {"Yes": 0.5385799637011498, "No": 0.4614034758511742}, "ground_truth": 1}, {"key": "35815905", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5996686657785938, "res": {"Yes": 0.5996686657785938, "No": 0.40030596971185173}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.48519536243798295, "res": {"No": 0.5147882849636317, "Yes": 0.48519536243798295}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.21692892796217525, "res": {"No": 0.7830573043790419, "Yes": 0.21692892796217525}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6386858966471137, "res": {"Yes": 0.6386858966471137, "No": 0.3612938004445422}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5450504226361687, "res": {"Yes": 0.5450504226361687, "No": 0.45492136461005483}, "ground_truth": 1}, {"key": "35260212", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6113204739703353, "res": {"Yes": 0.6113204739703353, "No": 0.38865823297904184}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6685220825509512, "res": {"Yes": 0.6685220825509512, "No": 0.33145789201614567}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.581089290368206, "res": {"Yes": 0.581089290368206, "No": 0.4188919199280384}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5753196037464432, "res": {"Yes": 0.5753196037464432, "No": 0.42466014023485343}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7223705822166467, "res": {"Yes": 0.7223705822166467, "No": 0.2776045111336714}, "ground_truth": 1}, {"key": "39193924", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7373980777349808, "res": {"Yes": 0.7373980777349808, "No": 0.26258007391002386}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5850323992210686, "res": {"Yes": 0.5850323992210686, "No": 0.41494981241678275}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.22634192060362082, "res": {"No": 0.7736351105113219, "Yes": 0.22634192060362082}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.43966878363727574, "res": {"No": 0.5602989491084117, "Yes": 0.43966878363727574}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3995682459319419, "res": {"No": 0.6003975859302404, "Yes": 0.3995682459319419}, "ground_truth": 1}, {"key": "40658569", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4174841289102613, "res": {"No": 0.5824941712675414, "Yes": 0.4174841289102613}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.31091957547637694, "res": {"No": 0.6890570225997864, "Yes": 0.31091957547637694}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.4153938220261089, "res": {"No": 0.5845870374016129, "Yes": 0.4153938220261089}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6062885203665479, "res": {"Yes": 0.6062885203665479, "No": 0.3936873549655475}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6442734507722402, "res": {"Yes": 0.6442734507722402, "No": 0.3557018496546718}, "ground_truth": 1}, {"key": "33497596", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5105100270216433, "res": {"Yes": 0.5105100270216433, "No": 0.48946885753786323}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5492487189952854, "res": {"Yes": 0.5492487189952854, "No": 0.4507280881771989}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5569053119527834, "res": {"Yes": 0.5569053119527834, "No": 0.4430662817171366}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6759957972799452, "res": {"Yes": 0.6759957972799452, "No": 0.3239846308380326}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4905331343826816, "res": {"No": 0.5094417808862323, "Yes": 0.4905331343826816}, "ground_truth": 1}, {"key": "40339241", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6027025063290259, "res": {"Yes": 0.6027025063290259, "No": 0.3972777344069277}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6005169568353982, "res": {"Yes": 0.6005169568353982, "No": 0.3994617352360831}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5068319955651536, "res": {"Yes": 0.5068319955651536, "No": 0.4931422534545728}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.8582077808409606, "res": {"Yes": 0.8582077808409606, "No": 0.1417675832465121}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8020744941142239, "res": {"Yes": 0.8020744941142239, "No": 0.1979069516314309}, "ground_truth": 1}, {"key": "31792608", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7584186174630511, "res": {"Yes": 0.7584186174630511, "No": 0.24155362037411576}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.8556272784805782, "res": {"Yes": 0.8556272784805782, "No": 0.14435269545441126}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6020130838135154, "res": {"Yes": 0.6020130838135154, "No": 0.3979685885712946}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6901053167962676, "res": {"Yes": 0.6901053167962676, "No": 0.3098728583456251}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5337104316112083, "res": {"Yes": 0.5337104316112083, "No": 0.4662773920708493}, "ground_truth": 1}, {"key": "33132662", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6963675283828189, "res": {"Yes": 0.6963675283828189, "No": 0.30361121320572704}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.613557324946955, "res": {"Yes": 0.613557324946955, "No": 0.38641923417385665}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.23837605244262122, "res": {"No": 0.7616097451189406, "Yes": 0.23837605244262122}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7530431189047373, "res": {"Yes": 0.7530431189047373, "No": 0.24693157624057802}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8259269232636802, "res": {"Yes": 0.8259269232636802, "No": 0.17404741793948497}, "ground_truth": 1}, {"key": "37577457", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7559310882997151, "res": {"Yes": 0.7559310882997151, "No": 0.24404720726616289}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7334098594154296, "res": {"Yes": 0.7334098594154296, "No": 0.2665644036085491}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.31681442076067035, "res": {"No": 0.6831408487189125, "Yes": 0.31681442076067035}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.29366124613339145, "res": {"No": 0.7062958770332899, "Yes": 0.29366124613339145}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.3260344918471754, "res": {"No": 0.673917647670563, "Yes": 0.3260344918471754}, "ground_truth": 1}, {"key": "38701278", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3362582543885364, "res": {"No": 0.6636987116468925, "Yes": 0.3362582543885364}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.2897213442039683, "res": {"No": 0.7102192669029704, "Yes": 0.2897213442039683}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.53003448951321, "res": {"Yes": 0.53003448951321, "No": 0.4699483142528162}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7263006728228533, "res": {"Yes": 0.7263006728228533, "No": 0.2736656152954892}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6947232876258231, "res": {"Yes": 0.6947232876258231, "No": 0.3052542631486208}, "ground_truth": 1}, {"key": "34570783", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6219637609988401, "res": {"Yes": 0.6219637609988401, "No": 0.37801005998490805}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.7332583159267517, "res": {"Yes": 0.7332583159267517, "No": 0.26671988263779894}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6126683482763815, "res": {"Yes": 0.6126683482763815, "No": 0.38731710062582664}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7754933279101812, "res": {"Yes": 0.7754933279101812, "No": 0.22449393225106193}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7414007030443789, "res": {"Yes": 0.7414007030443789, "No": 0.25858518591417057}, "ground_truth": 1}, {"key": "39064526", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7792790356567434, "res": {"Yes": 0.7792790356567434, "No": 0.2207102331515137}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.6830692251558551, "res": {"Yes": 0.6830692251558551, "No": 0.3169117294102643}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.459837781779255, "res": {"No": 0.5401322024690841, "Yes": 0.459837781779255}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5042344199987316, "res": {"Yes": 0.5042344199987316, "No": 0.49571775825287884}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5447522907643144, "res": {"Yes": 0.5447522907643144, "No": 0.4552166133597514}, "ground_truth": 1}, {"key": "40741545", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.32151547587284973, "res": {"No": 0.6784565093452409, "Yes": 0.32151547587284973}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.40978710919682587, "res": {"No": 0.5901823630060696, "Yes": 0.40978710919682587}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6117035373083817, "res": {"Yes": 0.6117035373083817, "No": 0.38824661329190574}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.6607499507726325, "res": {"Yes": 0.6607499507726325, "No": 0.3392010769835505}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5174194076396903, "res": {"Yes": 0.5174194076396903, "No": 0.482521620442377}, "ground_truth": 1}, {"key": "36929751", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6549970153990097, "res": {"Yes": 0.6549970153990097, "No": 0.3449525181407484}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.5855384076851061, "res": {"Yes": 0.5855384076851061, "No": 0.41440902906083876}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.6211077820695763, "res": {"Yes": 0.6211077820695763, "No": 0.3788675300241706}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.5669572924777231, "res": {"Yes": 0.5669572924777231, "No": 0.4330081365706341}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8281289168811404, "res": {"Yes": 0.8281289168811404, "No": 0.17184619797874837}, "ground_truth": 1}, {"key": "23984730", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6085733935142273, "res": {"Yes": 0.6085733935142273, "No": 0.391394882094952}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.4806123302778669, "res": {"No": 0.5193586468902565, "Yes": 0.4806123302778669}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.5898202792066708, "res": {"Yes": 0.5898202792066708, "No": 0.41015091567458717}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.47007203032965234, "res": {"No": 0.5299051079868837, "Yes": 0.47007203032965234}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5624259488829639, "res": {"Yes": 0.5624259488829639, "No": 0.43754850970736786}, "ground_truth": 1}, {"key": "36007415", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7000770349956521, "res": {"Yes": 0.7000770349956521, "No": 0.29989232062715176}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.40232958624049164, "res": {"No": 0.5976449682015239, "Yes": 0.40232958624049164}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_readability_ft_gpt35", "target_model": "human", "recognition_score": 0.7397586238351869, "res": {"Yes": 0.7397586238351869, "No": 0.26022162687627487}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_readability_ft_gpt35", "target_model": "claude", "recognition_score": 0.7299211969866537, "res": {"Yes": 0.7299211969866537, "No": 0.2700525525093342}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_readability_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8341202686548661, "res": {"Yes": 0.8341202686548661, "No": 0.16585195929532132}, "ground_truth": 1}, {"key": "38875041", "model": "cnn_readability_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7608715092413715, "res": {"Yes": 0.7608715092413715, "No": 0.2390975861824042}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_readability_ft_gpt35", "target_model": "llama", "recognition_score": 0.772448422059351, "res": {"Yes": 0.772448422059351, "No": 0.22752367046580577}, "ground_truth": 0}]