[{"key": "33773576", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 4.939324386420328e-06, "res": {"No": 0.9999949190499081, "Yes": 4.939324386420328e-06}, "ground_truth": 0}, {"key": "33773576", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999877668918251, "res": {"Yes": 0.9999877668918251, "No": 1.2173062977626549e-05}, "ground_truth": 0}, {"key": "33773576", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.8140367815546307e-07}, "ground_truth": 1}, {"key": "33773576", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.3497813966867257e-07}, "ground_truth": 0}, {"key": "33773576", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999800187796273, "res": {"Yes": 0.9999800187796273, "No": 1.986637408370128e-05}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.19452490069095568, "res": {"No": 0.805474801426248, "Yes": 0.19452490069095568}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.39204662728536e-06}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999350809073355, "res": {"Yes": 0.9999350809073355, "No": 6.49018129584212e-05}, "ground_truth": 1}, {"key": "37642631", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999919389784903, "res": {"Yes": 0.9999919389784903, "No": 8.017018205853713e-06}, "ground_truth": 0}, {"key": "37642631", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998061339044606, "res": {"Yes": 0.9998061339044606, "No": 0.00019383582889031013}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 2.2490197732792904e-05, "res": {"No": 0.9999772771531678, "Yes": 2.2490197732792904e-05}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.87208432044733e-07}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999933694113825, "res": {"Yes": 0.9999933694113825, "No": 6.608399939797316e-06}, "ground_truth": 1}, {"key": "36609836", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999180360292298, "res": {"Yes": 0.9999180360292298, "No": 8.192576709844835e-05}, "ground_truth": 0}, {"key": "36609836", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999959918780326, "res": {"Yes": 0.9999959918780326, "No": 3.908999887238859e-06}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00023433765795312776, "res": {"No": 0.9997656170119853, "Yes": 0.00023433765795312776}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9814121059639296, "res": {"Yes": 0.9814121059639296, "No": 0.01858792690765553}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.01222836531638887, "res": {"No": 0.9877715397935316, "Yes": 0.01222836531638887}, "ground_truth": 1}, {"key": "41035610", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.977194812643873, "res": {"Yes": 0.977194812643873, "No": 0.02280518857118491}, "ground_truth": 0}, {"key": "41035610", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.827037301814858, "res": {"Yes": 0.827037301814858, "No": 0.1729627371294383}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999930118027176, "res": {"Yes": 0.9999930118027176, "No": 6.923798657510219e-06}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9934461743139112, "res": {"Yes": 0.9934461743139112, "No": 0.006553857967874957}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999959918780326, "res": {"Yes": 0.9999959918780326, "No": 3.957583287220746e-06}, "ground_truth": 1}, {"key": "37592684", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 4.1640936919101477e-07}, "ground_truth": 0}, {"key": "37592684", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 7.034626222074366e-06, "res": {"No": 0.999992773397112, "Yes": 7.034626222074366e-06}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9711990265442962, "res": {"Yes": 0.9711990265442962, "No": 0.028800932900107917}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.02934741240405307, "res": {"No": 0.9706524264443396, "Yes": 0.02934741240405307}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9474130443595813, "res": {"Yes": 0.9474130443595813, "No": 0.05258681268931092}, "ground_truth": 1}, {"key": "38951040", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.26698468013489063, "res": {"No": 0.7330153323913449, "Yes": 0.26698468013489063}, "ground_truth": 0}, {"key": "38951040", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9980107757343059, "res": {"Yes": 0.9980107757343059, "No": 0.001989235271063943}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.09760319992341296, "res": {"No": 0.9023967317281988, "Yes": 0.09760319992341296}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.757848144864644, "res": {"Yes": 0.757848144864644, "No": 0.24215167329446283}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8628476231004985, "res": {"Yes": 0.8628476231004985, "No": 0.13715235373343454}, "ground_truth": 1}, {"key": "40774469", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.986194914369173, "res": {"Yes": 0.986194914369173, "No": 0.013805075011052053}, "ground_truth": 0}, {"key": "40774469", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.16528604499693747, "res": {"No": 0.8347138979754111, "Yes": 0.16528604499693747}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.2933523364159869e-06, "res": {"No": 0.9999984951481323, "Yes": 1.2933523364159869e-06}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.40313632451762554, "res": {"No": 0.5968637416990044, "Yes": 0.40313632451762554}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.008726089043007867, "res": {"No": 0.9912738775503703, "Yes": 0.008726089043007867}, "ground_truth": 1}, {"key": "40876288", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.15930268614978213, "res": {"No": 0.8406971927736197, "Yes": 0.15930268614978213}, "ground_truth": 0}, {"key": "40876288", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 6.528436393815093e-05, "res": {"No": 0.9999346041184038, "Yes": 6.528436393815093e-05}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.978344437859329, "res": {"Yes": 0.978344437859329, "No": 0.02165554364077701}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995406000165021, "res": {"Yes": 0.9995406000165021, "No": 0.0004593257061936573}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988197542385339, "res": {"Yes": 0.9988197542385339, "No": 0.0011801726944311716}, "ground_truth": 1}, {"key": "40340131", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999987886094374, "res": {"Yes": 0.999987886094374, "No": 1.2067459808193373e-05}, "ground_truth": 0}, {"key": "40340131", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.053964152254544775, "res": {"No": 0.9460356884571929, "Yes": 0.053964152254544775}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0020439470746587583, "res": {"No": 0.9979560363444984, "Yes": 0.0020439470746587583}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.001965514373955245, "res": {"No": 0.9980342839553908, "Yes": 0.001965514373955245}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999978991308068, "res": {"Yes": 0.9999978991308068, "No": 2.038553643195458e-06}, "ground_truth": 1}, {"key": "30121591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.987517808939859, "res": {"Yes": 0.987517808939859, "No": 0.012482095768141492}, "ground_truth": 0}, {"key": "30121591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984288827988751, "res": {"Yes": 0.9984288827988751, "No": 0.0015710344362397089}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.057203934385416357, "res": {"No": 0.9427957884465344, "Yes": 0.057203934385416357}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9978190475404207, "res": {"Yes": 0.9978190475404207, "No": 0.0021809144885107175}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7529141261372286, "res": {"Yes": 0.7529141261372286, "No": 0.24708573433734016}, "ground_truth": 1}, {"key": "35623366", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999871708812939, "res": {"Yes": 0.9999871708812939, "No": 1.2793171576125174e-05}, "ground_truth": 0}, {"key": "35623366", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.05031221441716681, "res": {"No": 0.9496875796512673, "Yes": 0.05031221441716681}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.07354302278475919, "res": {"No": 0.9264568754460151, "Yes": 0.07354302278475919}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989961570877414, "res": {"Yes": 0.9989961570877414, "No": 0.0010037658520511133}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994379503091363, "res": {"Yes": 0.9994379503091363, "No": 0.0005619627451705286}, "ground_truth": 1}, {"key": "41014093", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9480972884930792, "res": {"Yes": 0.9480972884930792, "No": 0.051902682718586925}, "ground_truth": 0}, {"key": "41014093", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9935639648709271, "res": {"Yes": 0.9935639648709271, "No": 0.006436077553314723}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 4.087716732111642e-06, "res": {"No": 0.9999958726752174, "Yes": 4.087716732111642e-06}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999839524287637, "res": {"Yes": 0.9999839524287637, "No": 1.5968380656031103e-05}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4492104467696129, "res": {"No": 0.5507894865002431, "Yes": 0.4492104467696129}, "ground_truth": 1}, {"key": "11387984", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6281178442741163, "res": {"Yes": 0.6281178442741163, "No": 0.3718821410660227}, "ground_truth": 0}, {"key": "11387984", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9926913013916511, "res": {"Yes": 0.9926913013916511, "No": 0.0073087011665628684}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999869324773808, "res": {"Yes": 0.9999869324773808, "No": 1.3025689956754535e-05}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.286703546644927e-07}, "ground_truth": 1}, {"key": "39508312", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999770387506135, "res": {"Yes": 0.9999770387506135, "No": 2.2883349681613656e-05}, "ground_truth": 0}, {"key": "39508312", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999756083404814, "res": {"Yes": 0.9999756083404814, "No": 2.4309508204831642e-05}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 6.14751518349551e-05, "res": {"No": 0.9999384183962248, "Yes": 6.14751518349551e-05}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.49661356029908527, "res": {"No": 0.5033864367145394, "Yes": 0.49661356029908527}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.01943460964568618, "res": {"No": 0.9805653557835609, "Yes": 0.01943460964568618}, "ground_truth": 1}, {"key": "35815369", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999344849262062, "res": {"Yes": 0.9999344849262062, "No": 6.549865171753798e-05}, "ground_truth": 0}, {"key": "35815369", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.46513882944876717, "res": {"No": 0.5348611812791372, "Yes": 0.46513882944876717}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.2823839808520858, "res": {"No": 0.71761593680823, "Yes": 0.2823839808520858}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.4580607645400928, "res": {"No": 0.5419391246469287, "Yes": 0.4580607645400928}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8767006315640339, "res": {"Yes": 0.8767006315640339, "No": 0.12329920703704952}, "ground_truth": 1}, {"key": "35802823", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993835392900295, "res": {"Yes": 0.9993835392900295, "No": 0.0006164017595275997}, "ground_truth": 0}, {"key": "35802823", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8908101138433361, "res": {"Yes": 0.8908101138433361, "No": 0.10918967187975634}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9984986489567917, "res": {"Yes": 0.9984986489567917, "No": 0.0015013022212440753}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.3539452637424768, "res": {"No": 0.6460546572710119, "Yes": 0.3539452637424768}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999917005724405, "res": {"Yes": 0.9999917005724405, "No": 8.176969113766654e-06}, "ground_truth": 1}, {"key": "38499968", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999206582977194, "res": {"Yes": 0.9999206582977194, "No": 7.924898126419338e-05}, "ground_truth": 0}, {"key": "38499968", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999922965856715, "res": {"Yes": 0.9999922965856715, "No": 7.625550815358807e-06}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998543958613116, "res": {"Yes": 0.9998543958613116, "No": 0.00014555813469262086}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999951574563252, "res": {"Yes": 0.9999951574563252, "No": 4.82096713314118e-06}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999987335551019, "res": {"Yes": 0.9999987335551019, "No": 1.2261602737473122e-06}, "ground_truth": 1}, {"key": "36926726", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999980183344636, "res": {"Yes": 0.9999980183344636, "No": 1.8497852623807093e-06}, "ground_truth": 0}, {"key": "36926726", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999309090568892, "res": {"Yes": 0.9999309090568892, "No": 6.899117224707674e-05}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 3.914409774157431e-06, "res": {"No": 0.9999958726752174, "Yes": 3.914409774157431e-06}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9968962766387662, "res": {"Yes": 0.9968962766387662, "No": 0.0031036855082891986}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 9.806748233437941e-08}, "ground_truth": 1}, {"key": "40903712", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997963611372085, "res": {"Yes": 0.9997963611372085, "No": 0.00020358763641682148}, "ground_truth": 0}, {"key": "40903712", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.00015596233845835815, "res": {"No": 0.9998439111831272, "Yes": 0.00015596233845835815}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.030866587215910676, "res": {"No": 0.96913327097738, "Yes": 0.030866587215910676}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999713171213617, "res": {"Yes": 0.9999713171213617, "No": 2.8553700944023848e-05}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991181047983528, "res": {"Yes": 0.9991181047983528, "No": 0.0008818149775358536}, "ground_truth": 1}, {"key": "19614862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999974223173222, "res": {"Yes": 0.9999974223173222, "No": 2.562326302980328e-06}, "ground_truth": 0}, {"key": "19614862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999959918780326, "res": {"Yes": 0.9999959918780326, "No": 3.9640988693252275e-06}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 8.646430336990252e-06, "res": {"No": 0.9999912237625114, "Yes": 8.646430336990252e-06}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999976607241361, "res": {"Yes": 0.9999976607241361, "No": 2.2682022513374613e-06}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999410407211666, "res": {"Yes": 0.9999410407211666, "No": 5.8898731738021146e-05}, "ground_truth": 1}, {"key": "38861704", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.6854684865708375e-07}, "ground_truth": 0}, {"key": "38861704", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 8.41660593142007e-07}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.006383455588254641, "res": {"No": 0.993616331046073, "Yes": 0.006383455588254641}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999821644040562, "res": {"Yes": 0.9999821644040562, "No": 1.7713756798668405e-05}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999902701413353, "res": {"Yes": 0.9999902701413353, "No": 9.667217843290096e-06}, "ground_truth": 1}, {"key": "34349607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999855020530962, "res": {"Yes": 0.9999855020530962, "No": 1.4418607471711756e-05}, "ground_truth": 0}, {"key": "34349607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 6.238393790962063e-08}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9842866710411722, "res": {"Yes": 0.9842866710411722, "No": 0.015713249583725258}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999380608083109, "res": {"Yes": 0.9999380608083109, "No": 6.190794712525171e-05}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999982567412194, "res": {"Yes": 0.9999982567412194, "No": 1.6788156221242212e-06}, "ground_truth": 1}, {"key": "20773800", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999871708812939, "res": {"Yes": 0.9999871708812939, "No": 1.277196529995027e-05}, "ground_truth": 0}, {"key": "20773800", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999858596579756, "res": {"Yes": 0.9999858596579756, "No": 1.4079791719400577e-05}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9697144114700749, "res": {"Yes": 0.9697144114700749, "No": 0.03028553721672803}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999888397127765, "res": {"Yes": 0.9999888397127765, "No": 1.1051283311019667e-05}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.5752274128385275e-07}, "ground_truth": 1}, {"key": "35545608", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999983759447187, "res": {"Yes": 0.9999983759447187, "No": 1.5348130129699475e-06}, "ground_truth": 0}, {"key": "35545608", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999944422379444, "res": {"Yes": 0.9999944422379444, "No": 5.481427490275685e-06}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.21383788452373512, "res": {"No": 0.7861620085847354, "Yes": 0.21383788452373512}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999974223173222, "res": {"Yes": 0.9999974223173222, "No": 2.5040127822675875e-06}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 1.9857936361982823e-07}, "ground_truth": 1}, {"key": "37258984", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999982567412194, "res": {"Yes": 0.9999982567412194, "No": 1.7006109314829528e-06}, "ground_truth": 0}, {"key": "37258984", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999819260003368, "res": {"Yes": 0.9999819260003368, "No": 1.7973358137059677e-05}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999095732987406, "res": {"Yes": 0.9999095732987406, "No": 9.039857987833401e-05}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.3541543329329877e-07}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9970981793443146, "res": {"Yes": 0.9970981793443146, "No": 0.0029017624070840978}, "ground_truth": 1}, {"key": "37274562", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.4848320243759192e-07}, "ground_truth": 0}, {"key": "37274562", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992623526956373, "res": {"Yes": 0.9992623526956373, "No": 0.0007375873766164867}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9666195444350663, "res": {"Yes": 0.9666195444350663, "No": 0.0333803658717883}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.0035374671580476647, "res": {"No": 0.9964622709614932, "Yes": 0.0035374671580476647}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1752643278107317, "res": {"No": 0.8247352691674298, "Yes": 0.1752643278107317}, "ground_truth": 1}, {"key": "40828068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9553266863975449, "res": {"Yes": 0.9553266863975449, "No": 0.044673209369705945}, "ground_truth": 0}, {"key": "40828068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.06883396352253524, "res": {"No": 0.9311657902074256, "Yes": 0.06883396352253524}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9997821825756604, "res": {"Yes": 0.9997821825756604, "No": 0.0002177582620776844}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995840719720543, "res": {"Yes": 0.9995840719720543, "No": 0.00041587825366303806}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998701285740239, "res": {"Yes": 0.9998701285740239, "No": 0.00012980438130346034}, "ground_truth": 1}, {"key": "37807180", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9576114536715636, "res": {"Yes": 0.9576114536715636, "No": 0.0423884906723207}, "ground_truth": 0}, {"key": "37807180", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9626109218304572, "res": {"Yes": 0.9626109218304572, "No": 0.03738902749849}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0012448764387183932, "res": {"No": 0.9987550666732522, "Yes": 0.0012448764387183932}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.145845184501685, "res": {"No": 0.8541547205490988, "Yes": 0.145845184501685}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9364942003652296, "res": {"Yes": 0.9364942003652296, "No": 0.06350572624897455}, "ground_truth": 1}, {"key": "40748607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997858770875837, "res": {"Yes": 0.9997858770875837, "No": 0.00021399562223445667}, "ground_truth": 0}, {"key": "40748607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.6348899513938806, "res": {"Yes": 0.6348899513938806, "No": 0.36510992732099423}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.7758879682757926, "res": {"Yes": 0.7758879682757926, "No": 0.22411176514989659}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999940846288958, "res": {"Yes": 0.9999940846288958, "No": 5.806038855982842e-06}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999862172649827, "res": {"Yes": 0.9999862172649827, "No": 1.3704243891469654e-05}, "ground_truth": 1}, {"key": "40123819", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999800187796273, "res": {"Yes": 0.9999800187796273, "No": 1.9935230791441552e-05}, "ground_truth": 0}, {"key": "40123819", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999902701413353, "res": {"Yes": 0.9999902701413353, "No": 9.681240636117828e-06}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 2.305511493636996e-06, "res": {"No": 0.9999971839107652, "Yes": 2.305511493636996e-06}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996046748615827, "res": {"Yes": 0.9996046748615827, "No": 0.00039527058589704375}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9988680474421706, "res": {"Yes": 0.9988680474421706, "No": 0.001131868468337887}, "ground_truth": 1}, {"key": "38453867", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9955865357845138, "res": {"Yes": 0.9955865357845138, "No": 0.0044135214209918274}, "ground_truth": 0}, {"key": "38453867", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8503545319895744, "res": {"Yes": 0.8503545319895744, "No": 0.14964539753765063}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.991414459075299, "res": {"Yes": 0.991414459075299, "No": 0.008585501246704125}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.7318490515612034, "res": {"Yes": 0.7318490515612034, "No": 0.26815087244171065}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9647919622935727, "res": {"Yes": 0.9647919622935727, "No": 0.03520802286666501}, "ground_truth": 1}, {"key": "38944856", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9903007035637176, "res": {"Yes": 0.9903007035637176, "No": 0.009699201659540926}, "ground_truth": 0}, {"key": "38944856", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.0025707412436675866, "res": {"No": 0.9974291964897928, "Yes": 0.0025707412436675866}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.36382965560097486, "res": {"No": 0.6361703344738668, "Yes": 0.36382965560097486}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9837799381819938, "res": {"Yes": 0.9837799381819938, "No": 0.016220019955395074}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9780562844900197, "res": {"Yes": 0.9780562844900197, "No": 0.02194366920430427}, "ground_truth": 1}, {"key": "35778898", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9671951791792134, "res": {"Yes": 0.9671951791792134, "No": 0.0328046173707901}, "ground_truth": 0}, {"key": "35778898", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999444856549178, "res": {"Yes": 0.999444856549178, "No": 0.0005550571369818114}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0648859412800876, "res": {"No": 0.9351139831604908, "Yes": 0.0648859412800876}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.3938581616190232e-06}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 8.904908583668901e-07}, "ground_truth": 1}, {"key": "32530125", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991739195924446, "res": {"Yes": 0.9991739195924446, "No": 0.0008259985829513782}, "ground_truth": 0}, {"key": "32530125", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.4396133318252457e-06}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00019976337836824054, "res": {"No": 0.9998001748876978, "Yes": 0.00019976337836824054}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9984835548666535, "res": {"Yes": 0.9984835548666535, "No": 0.00151646895882994}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.625921368269309e-07}, "ground_truth": 1}, {"key": "35010363", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.85273838054713e-07}, "ground_truth": 0}, {"key": "35010363", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.7147728981716544e-07}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9473318355940762, "res": {"Yes": 0.9473318355940762, "No": 0.05266803257453816}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997531146312096, "res": {"Yes": 0.9997531146312096, "No": 0.0002468627608109046}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.993663529240838, "res": {"Yes": 0.993663529240838, "No": 0.006336470937342865}, "ground_truth": 1}, {"key": "27514800", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999390143796986, "res": {"Yes": 0.9999390143796986, "No": 6.0892411312677506e-05}, "ground_truth": 0}, {"key": "27514800", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9982264324330448, "res": {"Yes": 0.9982264324330448, "No": 0.001773598048441903}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9974682120948357, "res": {"Yes": 0.9974682120948357, "No": 0.0025318146003289817}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.99996356913662, "res": {"Yes": 0.99996356913662, "No": 3.6349649369036584e-05}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.1896991302836553e-07}, "ground_truth": 1}, {"key": "25725840", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.2557005838322487e-07}, "ground_truth": 0}, {"key": "25725840", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998138806723514, "res": {"Yes": 0.9998138806723514, "No": 0.00018608965206992484}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9992248575782243, "res": {"Yes": 0.9992248575782243, "No": 0.0007750910900262056}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998123313119718, "res": {"Yes": 0.9998123313119718, "No": 0.00018763893505295594}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980347596186439, "res": {"Yes": 0.9980347596186439, "No": 0.001965170439034987}, "ground_truth": 1}, {"key": "38327225", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990330262207494, "res": {"Yes": 0.9990330262207494, "No": 0.0009668772592384844}, "ground_truth": 0}, {"key": "38327225", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999036136754603, "res": {"Yes": 0.9999036136754603, "No": 9.63350826199708e-05}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.20576710664779366, "res": {"No": 0.7942328410753251, "Yes": 0.20576710664779366}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999949190499081, "res": {"Yes": 0.9999949190499081, "No": 4.962234076431889e-06}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998475234238315, "res": {"Yes": 0.998475234238315, "No": 0.0015247399622800985}, "ground_truth": 1}, {"key": "11991724", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997392941696727, "res": {"Yes": 0.9997392941696727, "No": 0.00026063124606014046}, "ground_truth": 0}, {"key": "11991724", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999903893441826, "res": {"Yes": 0.9999903893441826, "No": 9.525329922676856e-06}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.005109445977092511, "res": {"No": 0.9948905860886486, "Yes": 0.005109445977092511}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999983237218497, "res": {"Yes": 0.999983237218497, "No": 1.6741096387097703e-05}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999953958625991, "res": {"Yes": 0.9999953958625991, "No": 4.510863316686778e-06}, "ground_truth": 1}, {"key": "32217545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 5.7250011135816704e-08}, "ground_truth": 0}, {"key": "32217545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988173766508207, "res": {"Yes": 0.9988173766508207, "No": 0.0011825359930076225}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0079491124345605, "res": {"No": 0.9920506495366742, "Yes": 0.0079491124345605}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.4761460201977256e-07}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8481962865390337, "res": {"Yes": 0.8481962865390337, "No": 0.15180370609356836}, "ground_truth": 1}, {"key": "12731847", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998874036694427, "res": {"Yes": 0.9998874036694427, "No": 0.00011255528891759168}, "ground_truth": 0}, {"key": "12731847", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.5702387193220876, "res": {"Yes": 0.5702387193220876, "No": 0.42976114559009515}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 4.0687041494720026e-06, "res": {"No": 0.9999958726752174, "Yes": 4.0687041494720026e-06}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.8227833065474496, "res": {"Yes": 0.8227833065474496, "No": 0.17721657620700076}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.013677269290235433, "res": {"No": 0.9863225796462424, "Yes": 0.013677269290235433}, "ground_truth": 1}, {"key": "36827234", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995245187370612, "res": {"Yes": 0.9995245187370612, "No": 0.0004754506342406533}, "ground_truth": 0}, {"key": "36827234", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.1367537795049745, "res": {"No": 0.8632462040495105, "Yes": 0.1367537795049745}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.015782966343819912, "res": {"No": 0.9842170342383751, "Yes": 0.015782966343819912}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.06480150827798223, "res": {"No": 0.9351984277657868, "Yes": 0.06480150827798223}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0001024455622980851, "res": {"No": 0.9998975348899081, "Yes": 0.0001024455622980851}, "ground_truth": 1}, {"key": "29111539", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.012245839895940991, "res": {"No": 0.9877540889878902, "Yes": 0.012245839895940991}, "ground_truth": 0}, {"key": "29111539", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.011168472784528077, "res": {"No": 0.9888314594480321, "Yes": 0.011168472784528077}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.15741695966164249, "res": {"No": 0.8425830297326983, "Yes": 0.15741695966164249}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999888397127765, "res": {"Yes": 0.9999888397127765, "No": 1.1071414960890103e-05}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.919965676308944e-07}, "ground_truth": 1}, {"key": "37763052", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6267606184531839, "res": {"Yes": 0.6267606184531839, "No": 0.3732393037648431}, "ground_truth": 0}, {"key": "37763052", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9711064960804212, "res": {"Yes": 0.9711064960804212, "No": 0.028893373523470427}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997892104192462, "res": {"Yes": 0.9997892104192462, "No": 0.00021071564234898972}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.997773718149654, "res": {"Yes": 0.997773718149654, "No": 0.0022262983621563898}, "ground_truth": 1}, {"key": "30682335", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 8.280379800298122e-09}, "ground_truth": 0}, {"key": "30682335", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9976422394939995, "res": {"Yes": 0.9976422394939995, "No": 0.002357776181875214}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.6635385937391476, "res": {"Yes": 0.6635385937391476, "No": 0.336461314784324}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996174247006003, "res": {"Yes": 0.9996174247006003, "No": 0.0003825433415022154}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 7.220084460440899e-07}, "ground_truth": 1}, {"key": "12261276", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.76663464219807e-07}, "ground_truth": 0}, {"key": "12261276", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.683587588034513e-07}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.004495225704374576, "res": {"No": 0.9955047646514879, "Yes": 0.004495225704374576}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.9580071393595487e-07}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 8.934996384372331e-08}, "ground_truth": 1}, {"key": "36912979", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.598311295982821e-07}, "ground_truth": 0}, {"key": "36912979", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 1.1606193023056919e-08}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9948811462135962, "res": {"Yes": 0.9948811462135962, "No": 0.00511868350972691}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999753699393249, "res": {"Yes": 0.9999753699393249, "No": 2.4516897114240412e-05}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999876476902904, "res": {"Yes": 0.9999876476902904, "No": 1.2234814776589076e-05}, "ground_truth": 1}, {"key": "30205259", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9738565192719414, "res": {"Yes": 0.9738565192719414, "No": 0.026143272169133355}, "ground_truth": 0}, {"key": "30205259", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996051515131895, "res": {"Yes": 0.9996051515131895, "No": 0.00039480207286531516}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.855671780812605, "res": {"Yes": 0.855671780812605, "No": 0.14432771016536727}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996209957902479, "res": {"Yes": 0.9996209957902479, "No": 0.00037892384869366946}, "ground_truth": 1}, {"key": "39458032", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.49877339729934783, "res": {"No": 0.501226256530995, "Yes": 0.49877339729934783}, "ground_truth": 0}, {"key": "39458032", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9967580385427447, "res": {"Yes": 0.9967580385427447, "No": 0.003241779083604956}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9943246470100051, "res": {"Yes": 0.9943246470100051, "No": 0.0056753706782186625}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.10840262222517812, "res": {"No": 0.891597296200729, "Yes": 0.10840262222517812}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.7071695130851256e-07}, "ground_truth": 1}, {"key": "35116452", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999995276659155, "res": {"Yes": 0.999995276659155, "No": 4.682136664403521e-06}, "ground_truth": 0}, {"key": "35116452", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993040111127034, "res": {"Yes": 0.9993040111127034, "No": 0.0006958871858943425}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8875624623468528, "res": {"Yes": 0.8875624623468528, "No": 0.11243744010134234}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.8098570243856984, "res": {"Yes": 0.8098570243856984, "No": 0.19014297306202857}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9414731797631789, "res": {"Yes": 0.9414731797631789, "No": 0.05852676546867022}, "ground_truth": 1}, {"key": "40107476", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8007839048674346, "res": {"Yes": 0.8007839048674346, "No": 0.19921608282846798}, "ground_truth": 0}, {"key": "40107476", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.18206223496498136, "res": {"No": 0.8179376972590969, "Yes": 0.18206223496498136}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9993543711080838, "res": {"Yes": 0.9993543711080838, "No": 0.0006456002847151732}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999641651360841, "res": {"Yes": 0.9999641651360841, "No": 3.575047507862383e-05}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999988527586581, "res": {"Yes": 0.9999988527586581, "No": 1.0160825114991958e-06}, "ground_truth": 1}, {"key": "39501049", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9839227806090595, "res": {"Yes": 0.9839227806090595, "No": 0.016077234722719175}, "ground_truth": 0}, {"key": "39501049", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.958503864197125, "res": {"Yes": 0.958503864197125, "No": 0.04149609303135763}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0007798862361559931, "res": {"No": 0.9992199814327705, "Yes": 0.0007798862361559931}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9982895169464311, "res": {"Yes": 0.9982895169464311, "No": 0.0017104787104739749}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999775151112301, "res": {"Yes": 0.999775151112301, "No": 0.0002248086414656647}, "ground_truth": 1}, {"key": "39642178", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.3391604092125018, "res": {"No": 0.6608395743661424, "Yes": 0.3391604092125018}, "ground_truth": 0}, {"key": "39642178", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9971001962765517, "res": {"Yes": 0.9971001962765517, "No": 0.002899787849530504}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.1529724253963555, "res": {"No": 0.8470274723231008, "Yes": 0.1529724253963555}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999987335551019, "res": {"Yes": 0.9999987335551019, "No": 1.144294806746689e-06}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.2462046481232326e-07}, "ground_truth": 1}, {"key": "38024796", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.4259355875606232e-07}, "ground_truth": 0}, {"key": "38024796", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 5.7856675309396365e-08}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999864556687252, "res": {"Yes": 0.9999864556687252, "No": 1.3490335739852662e-05}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999953958625991, "res": {"Yes": 0.9999953958625991, "No": 4.576884644085709e-06}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999959918780326, "res": {"Yes": 0.9999959918780326, "No": 3.9525010587277945e-06}, "ground_truth": 1}, {"key": "36652079", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.7887329566057775e-07}, "ground_truth": 0}, {"key": "36652079", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.5434245524479662, "res": {"Yes": 0.5434245524479662, "No": 0.4565753647597539}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.000645063755704476, "res": {"No": 0.9993548476403357, "Yes": 0.000645063755704476}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999985978860297, "res": {"Yes": 0.999985978860297, "No": 1.3941396197603904e-05}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9723100887990543, "res": {"Yes": 0.9723100887990543, "No": 0.027689846093849415}, "ground_truth": 1}, {"key": "32193402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9974701110766255, "res": {"Yes": 0.9974701110766255, "No": 0.0025298693952652334}, "ground_truth": 0}, {"key": "32193402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.7361546500318366, "res": {"Yes": 0.7361546500318366, "No": 0.263845308559281}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.11403737881361561, "res": {"No": 0.8859623355026668, "Yes": 0.11403737881361561}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.8669786046127796, "res": {"Yes": 0.8669786046127796, "No": 0.13302091599561602}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994872520401881, "res": {"Yes": 0.9994872520401881, "No": 0.0005127394687419433}, "ground_truth": 1}, {"key": "32589706", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995348808814496, "res": {"Yes": 0.9995348808814496, "No": 0.00046496087300151195}, "ground_truth": 0}, {"key": "32589706", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9970775678429188, "res": {"Yes": 0.9970775678429188, "No": 0.0029222628914653275}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.46435877665090397, "res": {"No": 0.5356411919903562, "Yes": 0.46435877665090397}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9482969569978578, "res": {"Yes": 0.9482969569978578, "No": 0.05170294685306364}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9954663772346486, "res": {"Yes": 0.9954663772346486, "No": 0.004533643763545576}, "ground_truth": 1}, {"key": "38590589", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996699528075618, "res": {"Yes": 0.9996699528075618, "No": 0.00032993364482835665}, "ground_truth": 0}, {"key": "38590589", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.3851243768934047, "res": {"No": 0.6148755250214702, "Yes": 0.3851243768934047}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0006752452498298266, "res": {"No": 0.9993246081798017, "Yes": 0.0006752452498298266}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9890900657632545, "res": {"Yes": 0.9890900657632545, "No": 0.01090981975887526}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9942981210691967, "res": {"Yes": 0.9942981210691967, "No": 0.005701910413683199}, "ground_truth": 1}, {"key": "37045414", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9774569324186405, "res": {"Yes": 0.9774569324186405, "No": 0.022543046946075004}, "ground_truth": 0}, {"key": "37045414", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.006397576706039138, "res": {"No": 0.9936024393932585, "Yes": 0.006397576706039138}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 8.476769863966706e-05, "res": {"No": 0.9999149369980623, "Yes": 8.476769863966706e-05}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 4.51063819862191e-07, "res": {"No": 0.9999992103693117, "Yes": 4.51063819862191e-07}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.002684939725168771, "res": {"No": 0.9973147635144788, "Yes": 0.002684939725168771}, "ground_truth": 1}, {"key": "33310095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.03146331547202548, "res": {"No": 0.9685362168969768, "Yes": 0.03146331547202548}, "ground_truth": 0}, {"key": "33310095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.06420460768931642, "res": {"No": 0.935794764728354, "Yes": 0.06420460768931642}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0004648670998507674, "res": {"No": 0.9995350000659958, "Yes": 0.0004648670998507674}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999775155557789, "res": {"Yes": 0.9999775155557789, "No": 2.239483961441502e-05}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999907469518097, "res": {"Yes": 0.9999907469518097, "No": 9.20884613017693e-06}, "ground_truth": 1}, {"key": "37934604", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999970647075079, "res": {"Yes": 0.9999970647075079, "No": 2.8533066732772002e-06}, "ground_truth": 0}, {"key": "37934604", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999313858390593, "res": {"Yes": 0.9999313858390593, "No": 6.854918782139182e-05}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0001034408092660752, "res": {"No": 0.9998963429787603, "Yes": 0.0001034408092660752}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9975762706865732, "res": {"Yes": 0.9975762706865732, "No": 0.0024236410582971217}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.04269099375844806, "res": {"No": 0.9573087469186162, "Yes": 0.04269099375844806}, "ground_truth": 1}, {"key": "39012181", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8430972380540358, "res": {"Yes": 0.8430972380540358, "No": 0.15690252912963404}, "ground_truth": 0}, {"key": "39012181", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.00909639588958337, "res": {"No": 0.990903494828499, "Yes": 0.00909639588958337}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999915813694369, "res": {"Yes": 0.9999915813694369, "No": 8.351043974754648e-06}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999967070975216, "res": {"Yes": 0.9999967070975216, "No": 3.2596556402182036e-06}, "ground_truth": 1}, {"key": "40221674", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999890781166442, "res": {"Yes": 0.9999890781166442, "No": 1.0826183064763565e-05}, "ground_truth": 0}, {"key": "40221674", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997359573653939, "res": {"Yes": 0.9997359573653939, "No": 0.0002640286336246403}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.32043398463989164, "res": {"No": 0.6795656533296528, "Yes": 0.32043398463989164}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999988527586581, "res": {"Yes": 0.9999988527586581, "No": 1.095466782654992e-06}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993880662079002, "res": {"Yes": 0.9993880662079002, "No": 0.0006117731586270227}, "ground_truth": 1}, {"key": "36884862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999609202831114, "res": {"Yes": 0.999609202831114, "No": 0.00039071049274229483}, "ground_truth": 0}, {"key": "36884862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998024393176823, "res": {"Yes": 0.9998024393176823, "No": 0.00019746148604630242}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9323577462869047, "res": {"Yes": 0.9323577462869047, "No": 0.0676421208821868}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9873447527214548, "res": {"Yes": 0.9873447527214548, "No": 0.012655230133078284}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8032725563688414, "res": {"Yes": 0.8032725563688414, "No": 0.19672731439689434}, "ground_truth": 1}, {"key": "39054429", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7842544168389135, "res": {"Yes": 0.7842544168389135, "No": 0.21574545829856673}, "ground_truth": 0}, {"key": "39054429", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988772011108994, "res": {"Yes": 0.9988772011108994, "No": 0.0011228005765316143}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.08197561122848931, "res": {"No": 0.9180242615565868, "Yes": 0.08197561122848931}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999980183344636, "res": {"Yes": 0.9999980183344636, "No": 1.951847886515205e-06}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.994892591093667, "res": {"Yes": 0.994892591093667, "No": 0.005107431719680689}, "ground_truth": 1}, {"key": "36753964", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 7.488882975486907e-07}, "ground_truth": 0}, {"key": "36753964", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999706019221319, "res": {"Yes": 0.9999706019221319, "No": 2.936761562736914e-05}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9627833774719902, "res": {"Yes": 0.9627833774719902, "No": 0.03721641319836298}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997166553096911, "res": {"Yes": 0.9997166553096911, "No": 0.00028333149086459664}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994267587655735, "res": {"Yes": 0.9994267587655735, "No": 0.0005732125314412601}, "ground_truth": 1}, {"key": "37612459", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999598739650709, "res": {"Yes": 0.9999598739650709, "No": 4.001160583738117e-05}, "ground_truth": 0}, {"key": "37612459", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9990332643602803, "res": {"Yes": 0.9990332643602803, "No": 0.0009666897032437114}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.989773367279527, "res": {"Yes": 0.989773367279527, "No": 0.01022645284107495}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9497285491074502, "res": {"Yes": 0.9497285491074502, "No": 0.050271216612949365}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9963524276132634, "res": {"Yes": 0.9963524276132634, "No": 0.0036475885535017763}, "ground_truth": 1}, {"key": "36805789", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990509977277514, "res": {"Yes": 0.9990509977277514, "No": 0.0009489784193726542}, "ground_truth": 0}, {"key": "36805789", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996987836547553, "res": {"Yes": 0.9996987836547553, "No": 0.0003010693262402101}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997856387386591, "res": {"Yes": 0.9997856387386591, "No": 0.00021426092713285012}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9967312669781179, "res": {"Yes": 0.9967312669781179, "No": 0.003268774941151367}, "ground_truth": 1}, {"key": "12757394", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999468813708443, "res": {"Yes": 0.9999468813708443, "No": 5.3093714909931155e-05}, "ground_truth": 0}, {"key": "12757394", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996355222181708, "res": {"Yes": 0.9996355222181708, "No": 0.00036434876625760155}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0001344544604862704, "res": {"No": 0.9998654802485932, "Yes": 0.0001344544604862704}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.00939840767811975, "res": {"No": 0.9906014778059189, "Yes": 0.00939840767811975}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.18722727982400508, "res": {"No": 0.8127727083881563, "Yes": 0.18722727982400508}, "ground_truth": 1}, {"key": "32192542", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9961782652879141, "res": {"Yes": 0.9961782652879141, "No": 0.0038216943789729572}, "ground_truth": 0}, {"key": "32192542", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999839524287637, "res": {"Yes": 0.9999839524287637, "No": 1.5961739191198667e-05}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.012821792713749254, "res": {"No": 0.9871781286594592, "Yes": 0.012821792713749254}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9933235904209057, "res": {"Yes": 0.9933235904209057, "No": 0.00667638904310197}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999584435804919, "res": {"Yes": 0.9999584435804919, "No": 4.14411586791389e-05}, "ground_truth": 1}, {"key": "34856060", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999918197754583, "res": {"Yes": 0.9999918197754583, "No": 8.056897508918253e-06}, "ground_truth": 0}, {"key": "34856060", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.011587874839557408, "res": {"No": 0.9884120228399389, "Yes": 0.011587874839557408}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.53788393356906e-07}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.4014384730712781, "res": {"No": 0.5985615612753463, "Yes": 0.4014384730712781}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999828796125555, "res": {"Yes": 0.9999828796125555, "No": 1.7017437573531096e-05}, "ground_truth": 1}, {"key": "36083416", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 8.23718493095641e-07}, "ground_truth": 0}, {"key": "36083416", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.993892990751873, "res": {"Yes": 0.993892990751873, "No": 0.006107023968441175}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9558851204926906, "res": {"Yes": 0.9558851204926906, "No": 0.04411490375476545}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9780835511231866, "res": {"Yes": 0.9780835511231866, "No": 0.02191641893504961}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999978991308068, "res": {"Yes": 0.9999978991308068, "No": 2.0396506801319736e-06}, "ground_truth": 1}, {"key": "33839050", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999576091905158, "res": {"Yes": 0.9999576091905158, "No": 4.227528168685732e-05}, "ground_truth": 0}, {"key": "33839050", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999531988512079, "res": {"Yes": 0.9999531988512079, "No": 4.6674620465483646e-05}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.002248942889630285, "res": {"No": 0.997751048688975, "Yes": 0.002248942889630285}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998670296813366, "res": {"Yes": 0.9998670296813366, "No": 0.00013287164113547892}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999910407653634, "res": {"Yes": 0.999910407653634, "No": 8.953759186764454e-05}, "ground_truth": 1}, {"key": "18464690", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9983913364884552, "res": {"Yes": 0.9983913364884552, "No": 0.0016086290250267954}, "ground_truth": 0}, {"key": "18464690", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999407942934993, "res": {"Yes": 0.999407942934993, "No": 0.0005920135706190583}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 3.2481722871639943e-05, "res": {"No": 0.9999675027220479, "Yes": 3.2481722871639943e-05}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9163542621537568, "res": {"Yes": 0.9163542621537568, "No": 0.08364560443759028}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994993973733282, "res": {"Yes": 0.9994993973733282, "No": 0.0005005890765098613}, "ground_truth": 1}, {"key": "39212665", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990055537896876, "res": {"Yes": 0.9990055537896876, "No": 0.0009943766495424348}, "ground_truth": 0}, {"key": "39212665", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999366304579342, "res": {"Yes": 0.9999366304579342, "No": 6.332305988321733e-05}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.07680327473184449, "res": {"No": 0.923196725626175, "Yes": 0.07680327473184449}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.0001998958654026974, "res": {"No": 0.9998000557215221, "Yes": 0.0001998958654026974}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0083817546580858, "res": {"No": 0.9916181462686406, "Yes": 0.0083817546580858}, "ground_truth": 1}, {"key": "40094011", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9271313220177799, "res": {"Yes": 0.9271313220177799, "No": 0.07286856063496279}, "ground_truth": 0}, {"key": "40094011", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.029610545920712862, "res": {"No": 0.970389352201086, "Yes": 0.029610545920712862}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0054381758284558586, "res": {"No": 0.9945618356441425, "Yes": 0.0054381758284558586}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.0017266036641302679, "res": {"No": 0.9982733587630783, "Yes": 0.0017266036641302679}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.29710573304949695, "res": {"No": 0.7028941974440657, "Yes": 0.29710573304949695}, "ground_truth": 1}, {"key": "36036272", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9987279553355669, "res": {"Yes": 0.9987279553355669, "No": 0.0012720030706933779}, "ground_truth": 0}, {"key": "36036272", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9917655225835752, "res": {"Yes": 0.9917655225835752, "No": 0.00823441628561655}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 2.3766607706681522e-05, "res": {"No": 0.9999760851449647, "Yes": 2.3766607706681522e-05}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999988527586581, "res": {"Yes": 0.9999988527586581, "No": 1.0420673306229366e-06}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997746743996271, "res": {"Yes": 0.9997746743996271, "No": 0.00022524474305877495}, "ground_truth": 1}, {"key": "30681904", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999470005685195, "res": {"Yes": 0.9999470005685195, "No": 5.2938589758875674e-05}, "ground_truth": 0}, {"key": "30681904", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999706019221319, "res": {"Yes": 0.9999706019221319, "No": 2.929399534425099e-05}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 9.666575893612432e-07, "res": {"No": 0.9999987335551019, "Yes": 9.666575893612432e-07}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 4.426227543541082e-07}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.1072391347609186e-07}, "ground_truth": 1}, {"key": "27834240", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.2959741489824198e-07}, "ground_truth": 0}, {"key": "27834240", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.7037525757913603e-07}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00045723594924039696, "res": {"No": 0.9995427374164156, "Yes": 0.00045723594924039696}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.7013888066403441, "res": {"Yes": 0.7013888066403441, "No": 0.2986111958815734}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999565364005696, "res": {"Yes": 0.9999565364005696, "No": 4.339310501939607e-05}, "ground_truth": 1}, {"key": "35025075", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5172841718826168, "res": {"Yes": 0.5172841718826168, "No": 0.4827158213868655}, "ground_truth": 0}, {"key": "35025075", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8302465866211813, "res": {"Yes": 0.8302465866211813, "No": 0.16975344808925014}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9857686852895442, "res": {"Yes": 0.9857686852895442, "No": 0.014231321557071248}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9943190976996354, "res": {"Yes": 0.9943190976996354, "No": 0.005680840964944074}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999933694113825, "res": {"Yes": 0.9999933694113825, "No": 6.512676822537618e-06}, "ground_truth": 1}, {"key": "33316985", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999537948404913, "res": {"Yes": 0.9999537948404913, "No": 4.609025585698646e-05}, "ground_truth": 0}, {"key": "33316985", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999938462231346, "res": {"Yes": 0.9999938462231346, "No": 6.040595247275144e-06}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0005903883601886396, "res": {"No": 0.9994094917186823, "Yes": 0.0005903883601886396}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.1887632339675485e-07}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990865698315521, "res": {"Yes": 0.9990865698315521, "No": 0.0009133841592360591}, "ground_truth": 1}, {"key": "17037056", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.4091751848819629e-06}, "ground_truth": 0}, {"key": "17037056", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9421048150171164, "res": {"Yes": 0.9421048150171164, "No": 0.05789519417540249}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.16772175380346782, "res": {"No": 0.8322779495274033, "Yes": 0.16772175380346782}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999940846288958, "res": {"Yes": 0.9999940846288958, "No": 5.812818458456388e-06}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999950382530095, "res": {"Yes": 0.9999950382530095, "No": 4.907789113246229e-06}, "ground_truth": 1}, {"key": "34050457", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999964686909351, "res": {"Yes": 0.9999964686909351, "No": 3.402214550461167e-06}, "ground_truth": 0}, {"key": "34050457", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.005130703985870519, "res": {"No": 0.9948689964012755, "Yes": 0.005130703985870519}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.776188520123632, "res": {"Yes": 0.776188520123632, "No": 0.22381149983419113}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996136116672062, "res": {"Yes": 0.9996136116672062, "No": 0.0003863476292032156}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999175592584247, "res": {"Yes": 0.9999175592584247, "No": 8.238398473099109e-05}, "ground_truth": 1}, {"key": "34713745", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.996227130424918, "res": {"Yes": 0.996227130424918, "No": 0.0037729050649682456}, "ground_truth": 0}, {"key": "34713745", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997445341369622, "res": {"Yes": 0.9997445341369622, "No": 0.00025543642630642993}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0003322745410145311, "res": {"No": 0.9996676886676463, "Yes": 0.0003322745410145311}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.1403781256138127, "res": {"No": 0.8596217689698066, "Yes": 0.1403781256138127}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.936386111760336, "res": {"Yes": 0.936386111760336, "No": 0.0636137905241518}, "ground_truth": 1}, {"key": "40856210", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996015841586785, "res": {"Yes": 0.9996015841586785, "No": 0.00039834969810574665}, "ground_truth": 0}, {"key": "40856210", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999189987897066, "res": {"Yes": 0.999189987897066, "No": 0.0008099459831424138}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 6.321784114825875e-05, "res": {"No": 0.9999366304579342, "Yes": 6.321784114825875e-05}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 1.0023162363046008e-06}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999974223173222, "res": {"Yes": 0.9999974223173222, "No": 2.4458349511992215e-06}, "ground_truth": 1}, {"key": "40848302", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995096401657008, "res": {"Yes": 0.9995096401657008, "No": 0.0004902475942941557}, "ground_truth": 0}, {"key": "40848302", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 2.1064531425395017e-06}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.2420926249242934e-06, "res": {"No": 0.9999984951481323, "Yes": 1.2420926249242934e-06}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999996945503965, "res": {"Yes": 0.999996945503965, "No": 2.996531814153732e-06}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.234041685892874e-07}, "ground_truth": 1}, {"key": "40636168", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 8.381398147484029e-08}, "ground_truth": 0}, {"key": "40636168", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999820452021894, "res": {"Yes": 0.9999820452021894, "No": 1.783975792733576e-05}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 5.346357377361929e-05, "res": {"No": 0.9999464045822857, "Yes": 5.346357377361929e-05}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999691715222073, "res": {"Yes": 0.9999691715222073, "No": 3.078084429323725e-05}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.99756346817414, "res": {"Yes": 0.99756346817414, "No": 0.00243657868969672}, "ground_truth": 1}, {"key": "34423311", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9780394092524702, "res": {"Yes": 0.9780394092524702, "No": 0.02196053939562851}, "ground_truth": 0}, {"key": "34423311", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999800187796273, "res": {"Yes": 0.9999800187796273, "No": 1.9922765203600536e-05}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.1395240348123119, "res": {"No": 0.8604754273367906, "Yes": 0.1395240348123119}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9918334122488929, "res": {"Yes": 0.9918334122488929, "No": 0.00816643677904879}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.24134464616231718, "res": {"No": 0.7586547651038742, "Yes": 0.24134464616231718}, "ground_truth": 1}, {"key": "34833945", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.03325674417889579, "res": {"No": 0.9667426367715719, "Yes": 0.03325674417889579}, "ground_truth": 0}, {"key": "34833945", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.01365017413895422, "res": {"No": 0.9863492491830307, "Yes": 0.01365017413895422}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 6.539256441009649e-05, "res": {"No": 0.9999343657340227, "Yes": 6.539256441009649e-05}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999828796125555, "res": {"Yes": 0.9999828796125555, "No": 1.7100736931070503e-05}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999981375378344, "res": {"Yes": 0.9999981375378344, "No": 1.7383346513027888e-06}, "ground_truth": 1}, {"key": "21272328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999807339855921, "res": {"Yes": 0.9999807339855921, "No": 1.9176365514001587e-05}, "ground_truth": 0}, {"key": "21272328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.2454818660137976, "res": {"No": 0.7545180937111089, "Yes": 0.2454818660137976}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00023850506761499416, "res": {"No": 0.999761326687008, "Yes": 0.00023850506761499416}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990191185789906, "res": {"Yes": 0.9990191185789906, "No": 0.0009808092124841716}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9736001784694831, "res": {"Yes": 0.9736001784694831, "No": 0.02639972725851735}, "ground_truth": 1}, {"key": "38648957", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998850198707218, "res": {"Yes": 0.9998850198707218, "No": 0.0001149479661794894}, "ground_truth": 0}, {"key": "38648957", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9989074087129792, "res": {"Yes": 0.9989074087129792, "No": 0.0010925184972681104}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9993869940049946, "res": {"Yes": 0.9993869940049946, "No": 0.0006129406166797167}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9985712623188803, "res": {"Yes": 0.9985712623188803, "No": 0.0014286513380111403}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999054015547151, "res": {"Yes": 0.9999054015547151, "No": 9.453362184708793e-05}, "ground_truth": 1}, {"key": "24942981", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999826412106655, "res": {"Yes": 0.9999826412106655, "No": 1.724662647981572e-05}, "ground_truth": 0}, {"key": "24942981", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8060964972553004, "res": {"Yes": 0.8060964972553004, "No": 0.19390349347610206}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.996323680271395, "res": {"Yes": 0.996323680271395, "No": 0.0036763145852804937}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999886013079656, "res": {"Yes": 0.9999886013079656, "No": 1.1307062810685705e-05}, "ground_truth": 1}, {"key": "35882366", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992804402074026, "res": {"Yes": 0.9992804402074026, "No": 0.0007195585204924661}, "ground_truth": 0}, {"key": "35882366", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.10919897523611785, "res": {"No": 0.8908009430004211, "Yes": 0.10919897523611785}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.3716116906953353e-05, "res": {"No": 0.9999862172649827, "Yes": 1.3716116906953353e-05}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9906421933539773, "res": {"Yes": 0.9906421933539773, "No": 0.009357725688644182}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999973031140366, "res": {"Yes": 0.9999973031140366, "No": 2.6482460632993374e-06}, "ground_truth": 1}, {"key": "40559523", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999983356420506, "res": {"Yes": 0.999983356420506, "No": 1.658005650899943e-05}, "ground_truth": 0}, {"key": "40559523", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9982197798749761, "res": {"Yes": 0.9982197798749761, "No": 0.0017801885381113953}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 3.3328992070667577e-06, "res": {"No": 0.9999965878943212, "Yes": 3.3328992070667577e-06}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9968266204466469, "res": {"Yes": 0.9968266204466469, "No": 0.0031733451344963365}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999994561441089, "res": {"Yes": 0.999994561441089, "No": 5.415252764622964e-06}, "ground_truth": 1}, {"key": "24632722", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999987335551019, "res": {"Yes": 0.9999987335551019, "No": 1.241684043665995e-06}, "ground_truth": 0}, {"key": "24632722", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999930118027176, "res": {"Yes": 0.9999930118027176, "No": 6.914983354560864e-06}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.998131772214123, "res": {"Yes": 0.998131772214123, "No": 0.0018681913661813378}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9864648955480623, "res": {"Yes": 0.9864648955480623, "No": 0.013535050836416807}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9948114134584859, "res": {"Yes": 0.9948114134584859, "No": 0.0051886242189448754}, "ground_truth": 1}, {"key": "36002759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997136760385316, "res": {"Yes": 0.9997136760385316, "No": 0.0002862706116282213}, "ground_truth": 0}, {"key": "36002759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9981751169276313, "res": {"Yes": 0.9981751169276313, "No": 0.0018249105624961164}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0045133405554221885, "res": {"No": 0.9954866999877313, "Yes": 0.0045133405554221885}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992998419251358, "res": {"Yes": 0.9992998419251358, "No": 0.0007001259573755786}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.048547246528168546, "res": {"No": 0.9514527289852683, "Yes": 0.048547246528168546}, "ground_truth": 1}, {"key": "29508534", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998356874507859, "res": {"Yes": 0.9998356874507859, "No": 0.0001642503121737734}, "ground_truth": 0}, {"key": "29508534", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999973031140366, "res": {"Yes": 0.9999973031140366, "No": 2.659107547300217e-06}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.013877607625980259, "res": {"No": 0.9861223449279671, "Yes": 0.013877607625980259}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.8266539179273516e-07}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.6805340855495598e-07}, "ground_truth": 1}, {"key": "15631612", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 4.6405817890648285e-08}, "ground_truth": 0}, {"key": "15631612", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999987335551019, "res": {"Yes": 0.9999987335551019, "No": 1.1407712376988906e-06}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0010151021816287588, "res": {"No": 0.9989848552084483, "Yes": 0.0010151021816287588}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999814491960682, "res": {"Yes": 0.9999814491960682, "No": 1.8459636874872966e-05}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998522505060318, "res": {"Yes": 0.9998522505060318, "No": 0.00014763419488016745}, "ground_truth": 1}, {"key": "40731892", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998154300351321, "res": {"Yes": 0.9998154300351321, "No": 0.0001844874718576109}, "ground_truth": 0}, {"key": "40731892", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999902701413353, "res": {"Yes": 0.9999902701413353, "No": 9.65844399341905e-06}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999753699393249, "res": {"Yes": 0.9999753699393249, "No": 2.4514273946591163e-05}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9917315155268602, "res": {"Yes": 0.9917315155268602, "No": 0.008268474077251496}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.3000765030901866e-07}, "ground_truth": 1}, {"key": "35971910", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997732442829648, "res": {"Yes": 0.9997732442829648, "No": 0.0002267131490835168}, "ground_truth": 0}, {"key": "35971910", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999961110815618, "res": {"Yes": 0.9999961110815618, "No": 3.800604214712497e-06}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0008178406865896572, "res": {"No": 0.9991818923327096, "Yes": 0.0008178406865896572}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993068663681752, "res": {"Yes": 0.9993068663681752, "No": 0.0006931128703213505}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999928926002577, "res": {"Yes": 0.9999928926002577, "No": 7.0695905037139836e-06}, "ground_truth": 1}, {"key": "34428424", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997803949167271, "res": {"Yes": 0.9997803949167271, "No": 0.00021953102312819334}, "ground_truth": 0}, {"key": "34428424", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.00019047511535268553, "res": {"No": 0.9998092326084134, "Yes": 0.00019047511535268553}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9968389309326935, "res": {"Yes": 0.9968389309326935, "No": 0.003160953046060236}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9536593144973373, "res": {"Yes": 0.9536593144973373, "No": 0.04634059130114868}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999725091278809, "res": {"Yes": 0.9999725091278809, "No": 2.741736462127478e-05}, "ground_truth": 1}, {"key": "36971005", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999978991308068, "res": {"Yes": 0.9999978991308068, "No": 2.073170458418374e-06}, "ground_truth": 0}, {"key": "36971005", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.006339111894987765, "res": {"No": 0.9936605864112875, "Yes": 0.006339111894987765}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9685934707020069, "res": {"Yes": 0.9685934707020069, "No": 0.03140629275300194}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999838332276837, "res": {"Yes": 0.9999838332276837, "No": 1.6096945893891648e-05}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999621387467553, "res": {"Yes": 0.9999621387467553, "No": 3.783984159378934e-05}, "ground_truth": 1}, {"key": "34649067", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.359397587105094e-07}, "ground_truth": 0}, {"key": "34649067", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999970647075079, "res": {"Yes": 0.9999970647075079, "No": 2.830877000915563e-06}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 3.3367876340545856e-06, "res": {"No": 0.9999964686909351, "Yes": 3.3367876340545856e-06}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999970647075079, "res": {"Yes": 0.9999970647075079, "No": 2.820613904713011e-06}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999747739361825, "res": {"Yes": 0.9999747739361825, "No": 2.510049477172247e-05}, "ground_truth": 1}, {"key": "37355154", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999516492769339, "res": {"Yes": 0.9999516492769339, "No": 4.8260603146023125e-05}, "ground_truth": 0}, {"key": "37355154", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.978978346180619, "res": {"Yes": 0.978978346180619, "No": 0.021021711382134527}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 6.21726727260433e-05, "res": {"No": 0.9999374648254056, "Yes": 6.21726727260433e-05}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.990846611664333, "res": {"Yes": 0.990846611664333, "No": 0.009153380631570262}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998989651903601, "res": {"Yes": 0.9998989651903601, "No": 0.00010098677401947315}, "ground_truth": 1}, {"key": "38674697", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999734627301196, "res": {"Yes": 0.9999734627301196, "No": 2.6463662298305588e-05}, "ground_truth": 0}, {"key": "38674697", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.98421668779404, "res": {"Yes": 0.98421668779404, "No": 0.01578331357289899}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 3.2826648866419064e-06, "res": {"No": 0.9999956342685299, "Yes": 3.2826648866419064e-06}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.011947533781746912, "res": {"No": 0.9880523967427908, "Yes": 0.011947533781746912}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999663107274963, "res": {"Yes": 0.9999663107274963, "No": 3.362199809542829e-05}, "ground_truth": 1}, {"key": "40525767", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999909853566321, "res": {"Yes": 0.9999909853566321, "No": 8.960218008209979e-06}, "ground_truth": 0}, {"key": "40525767", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999295979043439, "res": {"Yes": 0.9999295979043439, "No": 7.030138908180366e-05}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.09965044168199899, "res": {"No": 0.9003495339489093, "Yes": 0.09965044168199899}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992006967131954, "res": {"Yes": 0.9992006967131954, "No": 0.0007993129594215657}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9907665703447288, "res": {"Yes": 0.9907665703447288, "No": 0.00923332921948679}, "ground_truth": 1}, {"key": "27165110", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998665529248532, "res": {"Yes": 0.9998665529248532, "No": 0.00013338738422258024}, "ground_truth": 0}, {"key": "27165110", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9043281198588404, "res": {"Yes": 0.9043281198588404, "No": 0.09567174209883263}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9993411554834252, "res": {"Yes": 0.9993411554834252, "No": 0.0006587441754298578}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9973783227141608, "res": {"Yes": 0.9973783227141608, "No": 0.0026216305695538904}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9938703822294341, "res": {"Yes": 0.9938703822294341, "No": 0.006129666102072478}, "ground_truth": 1}, {"key": "35497491", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999949190499081, "res": {"Yes": 0.9999949190499081, "No": 5.0191196909830715e-06}, "ground_truth": 0}, {"key": "35497491", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993192514145293, "res": {"Yes": 0.9993192514145293, "No": 0.0006807040008330651}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9852963964232885, "res": {"Yes": 0.9852963964232885, "No": 0.014703387052550865}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9526380462847611, "res": {"Yes": 0.9526380462847611, "No": 0.047361794428920294}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9854932921080455, "res": {"Yes": 0.9854932921080455, "No": 0.014506685019099411}, "ground_truth": 1}, {"key": "40690716", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8258930857308008, "res": {"Yes": 0.8258930857308008, "No": 0.1741067085866592}, "ground_truth": 0}, {"key": "40690716", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.26282848705913997, "res": {"No": 0.7371712889681701, "Yes": 0.26282848705913997}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00048619328858151236, "res": {"No": 0.9995135572816416, "Yes": 0.00048619328858151236}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998652418606938, "res": {"Yes": 0.9998652418606938, "No": 0.00013466854779419787}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9922689092095636, "res": {"Yes": 0.9922689092095636, "No": 0.00773103446985206}, "ground_truth": 1}, {"key": "34835193", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999789459686392, "res": {"Yes": 0.9999789459686392, "No": 2.098650386371913e-05}, "ground_truth": 0}, {"key": "34835193", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9842245428587709, "res": {"Yes": 0.9842245428587709, "No": 0.015775439664129726}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9843414166196479, "res": {"Yes": 0.9843414166196479, "No": 0.015658537242969343}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8579755125954451, "res": {"Yes": 0.8579755125954451, "No": 0.14202444333963476}, "ground_truth": 1}, {"key": "39471712", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999739395305799, "res": {"Yes": 0.9999739395305799, "No": 2.5984535119616513e-05}, "ground_truth": 0}, {"key": "39471712", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9905574970672634, "res": {"Yes": 0.9905574970672634, "No": 0.009442407495846687}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.4671778961080052, "res": {"No": 0.5328220369336922, "Yes": 0.4671778961080052}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9574181161169139, "res": {"Yes": 0.9574181161169139, "No": 0.042581857359533765}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9816284713139607, "res": {"Yes": 0.9816284713139607, "No": 0.01837156849305906}, "ground_truth": 1}, {"key": "39115192", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9952155322048406, "res": {"Yes": 0.9952155322048406, "No": 0.0047844447524772234}, "ground_truth": 0}, {"key": "39115192", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999899125338788, "res": {"Yes": 0.9999899125338788, "No": 1.0067964567661395e-05}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 5.415231103655224e-06, "res": {"No": 0.999994561441089, "Yes": 5.415231103655224e-06}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997029545267453, "res": {"Yes": 0.9997029545267453, "No": 0.0002970277467870084}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987323566394913, "res": {"Yes": 0.9987323566394913, "No": 0.0012676199396918083}, "ground_truth": 1}, {"key": "23520673", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998958662122993, "res": {"Yes": 0.9998958662122993, "No": 0.00010404948028451585}, "ground_truth": 0}, {"key": "23520673", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999531988512079, "res": {"Yes": 0.9999531988512079, "No": 4.6741973818291276e-05}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9996831764491844, "res": {"Yes": 0.9996831764491844, "No": 0.00031674104837968106}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996184971307335, "res": {"Yes": 0.9996184971307335, "No": 0.000381475473100429}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999980183344636, "res": {"Yes": 0.9999980183344636, "No": 1.8715398813449344e-06}, "ground_truth": 1}, {"key": "35764233", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978134680512519, "res": {"Yes": 0.9978134680512519, "No": 0.002186507624582149}, "ground_truth": 0}, {"key": "35764233", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999695291212467, "res": {"Yes": 0.9999695291212467, "No": 3.0389968121987755e-05}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8218597573320049, "res": {"Yes": 0.8218597573320049, "No": 0.17814012843514088}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.015044512082014329, "res": {"No": 0.9849554817739544, "Yes": 0.015044512082014329}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999992773397112, "res": {"Yes": 0.999992773397112, "No": 7.102306269298518e-06}, "ground_truth": 1}, {"key": "35228910", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.980067917644533, "res": {"Yes": 0.980067917644533, "No": 0.019932021896569323}, "ground_truth": 0}, {"key": "35228910", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9957882736019884, "res": {"Yes": 0.9957882736019884, "No": 0.004211686995630889}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.04366363387960032, "res": {"No": 0.9563359304215339, "Yes": 0.04366363387960032}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990607522695415, "res": {"Yes": 0.9990607522695415, "No": 0.0009390413908641166}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6365037496227907, "res": {"Yes": 0.6365037496227907, "No": 0.36349577688464474}, "ground_truth": 1}, {"key": "36795599", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995103550152511, "res": {"Yes": 0.9995103550152511, "No": 0.00048957328167377}, "ground_truth": 0}, {"key": "36795599", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9913220149786315, "res": {"Yes": 0.9913220149786315, "No": 0.008677750004357684}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00041867215107023, "res": {"No": 0.9995812122960609, "Yes": 0.00041867215107023}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999864556687252, "res": {"Yes": 0.9999864556687252, "No": 1.3447329793366905e-05}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999927452391705, "res": {"Yes": 0.999927452391705, "No": 7.251653160201306e-05}, "ground_truth": 1}, {"key": "38641949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997694306352025, "res": {"Yes": 0.9997694306352025, "No": 0.0002304575217336926}, "ground_truth": 0}, {"key": "38641949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999919389784903, "res": {"Yes": 0.9999919389784903, "No": 8.00159228871594e-06}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9599094306920051, "res": {"Yes": 0.9599094306920051, "No": 0.04009012637701754}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9984950819265896, "res": {"Yes": 0.9984950819265896, "No": 0.001504737221019651}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9921527328322002, "res": {"Yes": 0.9921527328322002, "No": 0.007847068942764237}, "ground_truth": 1}, {"key": "29968443", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999249975758899, "res": {"Yes": 0.999249975758899, "No": 0.0007499597646547327}, "ground_truth": 0}, {"key": "29968443", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8415530459199656, "res": {"Yes": 0.8415530459199656, "No": 0.1584467823639937}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.6617332631478887, "res": {"Yes": 0.6617332631478887, "No": 0.3382666463453378}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999920581810364, "res": {"Yes": 0.9999920581810364, "No": 7.866486794249554e-06}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9985938531522247, "res": {"Yes": 0.9985938531522247, "No": 0.0014061047306451046}, "ground_truth": 1}, {"key": "21268042", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8890040658225561, "res": {"Yes": 0.8890040658225561, "No": 0.11099593499578352}, "ground_truth": 0}, {"key": "21268042", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999937270200753, "res": {"Yes": 0.9999937270200753, "No": 6.214010855826583e-06}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.6581514874935516, "res": {"Yes": 0.6581514874935516, "No": 0.3418485076989021}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997644252520895, "res": {"Yes": 0.9997644252520895, "No": 0.00023553924805173252}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999932502087799, "res": {"Yes": 0.9999932502087799, "No": 6.644347930230484e-06}, "ground_truth": 1}, {"key": "26808572", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.029924346198724e-07}, "ground_truth": 0}, {"key": "26808572", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.2413954730994875e-07}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0013682503118792782, "res": {"No": 0.9986317714793166, "Yes": 0.0013682503118792782}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.00022142469582173968, "res": {"No": 0.9997784880673918, "Yes": 0.00022142469582173968}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.02372001671910985, "res": {"No": 0.9762799789776129, "Yes": 0.02372001671910985}, "ground_truth": 1}, {"key": "37829390", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.017974755099034456, "res": {"No": 0.9820252668194246, "Yes": 0.017974755099034456}, "ground_truth": 0}, {"key": "37829390", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.19227733424017135, "res": {"No": 0.8077225808080591, "Yes": 0.19227733424017135}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9718523007779661, "res": {"Yes": 0.9718523007779661, "No": 0.028147639000776218}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9862861573985258, "res": {"Yes": 0.9862861573985258, "No": 0.013713756854580667}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999716747231683, "res": {"Yes": 0.9999716747231683, "No": 2.8267042724224087e-05}, "ground_truth": 1}, {"key": "35716045", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999939654258081, "res": {"Yes": 0.9999939654258081, "No": 5.980478359342091e-06}, "ground_truth": 0}, {"key": "35716045", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993841349227964, "res": {"Yes": 0.9993841349227964, "No": 0.000615790961645742}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.07252780307105544, "res": {"No": 0.9274718457015783, "Yes": 0.07252780307105544}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.0018192771993317542, "res": {"No": 0.9981806982394016, "Yes": 0.0018192771993317542}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.015323326557848871, "res": {"No": 0.9846764942393937, "Yes": 0.015323326557848871}, "ground_truth": 1}, {"key": "34367070", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7363315177070239, "res": {"Yes": 0.7363315177070239, "No": 0.26366819590681173}, "ground_truth": 0}, {"key": "34367070", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.0010526607210292718, "res": {"No": 0.9989472624174173, "Yes": 0.0010526607210292718}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.22186788208737773, "res": {"No": 0.7781320648850005, "Yes": 0.22186788208737773}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9946331846878597, "res": {"Yes": 0.9946331846878597, "No": 0.005366805641840505}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.988219774643606, "res": {"Yes": 0.988219774643606, "No": 0.011780193202521777}, "ground_truth": 1}, {"key": "35239748", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8800085549702823, "res": {"Yes": 0.8800085549702823, "No": 0.11999138865300614}, "ground_truth": 0}, {"key": "35239748", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.015394108618446147, "res": {"No": 0.9846058713429089, "Yes": 0.015394108618446147}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999062359061275, "res": {"Yes": 0.9999062359061275, "No": 9.372477462372791e-05}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999978991308068, "res": {"Yes": 0.9999978991308068, "No": 1.997570231948345e-06}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999981375378344, "res": {"Yes": 0.9999981375378344, "No": 1.827073594080671e-06}, "ground_truth": 1}, {"key": "40421370", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998762071829632, "res": {"Yes": 0.9998762071829632, "No": 0.00012369892116329795}, "ground_truth": 0}, {"key": "40421370", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997093896353749, "res": {"Yes": 0.9997093896353749, "No": 0.0002906054653156358}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998008899750327, "res": {"Yes": 0.9998008899750327, "No": 0.0001990371633844281}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998990843823236, "res": {"Yes": 0.9998990843823236, "No": 0.00010087736366756033}, "ground_truth": 1}, {"key": "37288396", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999951574563252, "res": {"Yes": 0.9999951574563252, "No": 4.794649256799095e-06}, "ground_truth": 0}, {"key": "37288396", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9989386960817931, "res": {"Yes": 0.9989386960817931, "No": 0.001061231449871589}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9993518731250197, "res": {"Yes": 0.9993518731250197, "No": 0.0006480880443053606}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999983759447187, "res": {"Yes": 0.9999983759447187, "No": 1.5047993363225388e-06}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 7.99614580295336e-07}, "ground_truth": 1}, {"key": "38903688", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999915813694369, "res": {"Yes": 0.9999915813694369, "No": 8.330525654458097e-06}, "ground_truth": 0}, {"key": "38903688", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.992599435537124, "res": {"Yes": 0.992599435537124, "No": 0.007400546723108266}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.0146031572512163e-06, "res": {"No": 0.99999861435166, "Yes": 1.0146031572512163e-06}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9933347599108157, "res": {"Yes": 0.9933347599108157, "No": 0.006665162130439445}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980073295092463, "res": {"Yes": 0.9980073295092463, "No": 0.001992676637574165}, "ground_truth": 1}, {"key": "28071228", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.09375607652175919, "res": {"No": 0.9062437585085032, "Yes": 0.09375607652175919}, "ground_truth": 0}, {"key": "28071228", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999878702827097, "res": {"Yes": 0.999878702827097, "No": 0.00012123921264267788}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9995259485179269, "res": {"Yes": 0.9995259485179269, "No": 0.00047399712580031367}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989325114716829, "res": {"Yes": 0.9989325114716829, "No": 0.0010673962577709317}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9963061617672446, "res": {"Yes": 0.9963061617672446, "No": 0.0036938500163204986}, "ground_truth": 1}, {"key": "36855834", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997284495365032, "res": {"Yes": 0.9997284495365032, "No": 0.00027153622556379004}, "ground_truth": 0}, {"key": "36855834", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9945281190775958, "res": {"Yes": 0.9945281190775958, "No": 0.005471931045912309}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.07836255347318165, "res": {"No": 0.9216372288212591, "Yes": 0.07836255347318165}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9815887200922745, "res": {"Yes": 0.9815887200922745, "No": 0.018411231370779824}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.50813033466981, "res": {"Yes": 0.50813033466981, "No": 0.49186971719764383}, "ground_truth": 1}, {"key": "40548717", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9404782843324151, "res": {"Yes": 0.9404782843324151, "No": 0.05952167780062573}, "ground_truth": 0}, {"key": "40548717", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.1545094839096208, "res": {"No": 0.8454903365343047, "Yes": 0.1545094839096208}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8092405287356778, "res": {"Yes": 0.8092405287356778, "No": 0.19075932958509925}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999981375378344, "res": {"Yes": 0.9999981375378344, "No": 1.7687101603363495e-06}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 7.11799969296055e-08}, "ground_truth": 1}, {"key": "37051175", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999931310055916, "res": {"Yes": 0.9999931310055916, "No": 6.7574024142673104e-06}, "ground_truth": 0}, {"key": "37051175", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.4697003815838038e-06}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9992566388299146, "res": {"Yes": 0.9992566388299146, "No": 0.000743266200117518}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999763235462916, "res": {"Yes": 0.9999763235462916, "No": 2.3571316209501524e-05}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9963065177474999, "res": {"Yes": 0.9963065177474999, "No": 0.0036934289414203604}, "ground_truth": 1}, {"key": "38882119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999928926002577, "res": {"Yes": 0.9999928926002577, "No": 6.984389295007415e-06}, "ground_truth": 0}, {"key": "38882119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9955144555393382, "res": {"Yes": 0.9955144555393382, "No": 0.004485505862395051}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.014357962681134708, "res": {"No": 0.9856419649845297, "Yes": 0.014357962681134708}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992445001338468, "res": {"Yes": 0.9992445001338468, "No": 0.0007554660608703349}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 5.7282309249308986e-08}, "ground_truth": 1}, {"key": "19485402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 2.1634421861709374e-06}, "ground_truth": 0}, {"key": "19485402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.5043267537739325, "res": {"Yes": 0.5043267537739325, "No": 0.4956733191478641}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8957411382073147, "res": {"Yes": 0.8957411382073147, "No": 0.10425871757258055}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997756278152045, "res": {"Yes": 0.9997756278152045, "No": 0.00022427961574337951}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8507792880842816, "res": {"Yes": 0.8507792880842816, "No": 0.149220679241849}, "ground_truth": 1}, {"key": "36060907", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999814491960682, "res": {"Yes": 0.9999814491960682, "No": 1.8506232328325708e-05}, "ground_truth": 0}, {"key": "36060907", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.6160140298361155, "res": {"Yes": 0.6160140298361155, "No": 0.3839859175936814}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 3.846865461945458e-07, "res": {"No": 0.9999993295729247, "Yes": 3.846865461945458e-07}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996911606007087, "res": {"Yes": 0.9996911606007087, "No": 0.0003087693499756445}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9268742085324515, "res": {"Yes": 0.9268742085324515, "No": 0.07312565618502138}, "ground_truth": 1}, {"key": "24037309", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999766811478886, "res": {"Yes": 0.9999766811478886, "No": 2.322688764827168e-05}, "ground_truth": 0}, {"key": "24037309", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.00010915223486567162, "res": {"No": 0.9998907410091983, "Yes": 0.00010915223486567162}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9993065089761315, "res": {"Yes": 0.9993065089761315, "No": 0.0006934457137030523}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999900317366834, "res": {"Yes": 0.9999900317366834, "No": 9.854572473352444e-06}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9546600580760908, "res": {"Yes": 0.9546600580760908, "No": 0.04533985644937812}, "ground_truth": 1}, {"key": "35605805", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9987864537435287, "res": {"Yes": 0.9987864537435287, "No": 0.0012134909385837407}, "ground_truth": 0}, {"key": "35605805", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9071484053822566, "res": {"Yes": 0.9071484053822566, "No": 0.09285150336355134}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0020718434758123312, "res": {"No": 0.9979281432643249, "Yes": 0.0020718434758123312}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9085281377217868, "res": {"Yes": 0.9085281377217868, "No": 0.09147177721660413}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9671054198942785, "res": {"Yes": 0.9671054198942785, "No": 0.032894549619354375}, "ground_truth": 1}, {"key": "17706248", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998451030377734, "res": {"Yes": 0.9998451030377734, "No": 0.00015484406185561293}, "ground_truth": 0}, {"key": "17706248", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999791843696483, "res": {"Yes": 0.9999791843696483, "No": 2.0768284885801742e-05}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.18976145416923784, "res": {"No": 0.8102385406832642, "Yes": 0.18976145416923784}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999709595226828, "res": {"Yes": 0.9999709595226828, "No": 2.898920612061052e-05}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999232805730858, "res": {"Yes": 0.9999232805730858, "No": 7.662953355322732e-05}, "ground_truth": 1}, {"key": "36883559", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998238882994865, "res": {"Yes": 0.9998238882994865, "No": 0.00017605748446063345}, "ground_truth": 0}, {"key": "36883559", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.15738507021612497, "res": {"No": 0.8426148631208905, "Yes": 0.15738507021612497}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 9.554703611096297e-06, "res": {"No": 0.9999903893441826, "Yes": 9.554703611096297e-06}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9840041514357628, "res": {"Yes": 0.9840041514357628, "No": 0.015995849446317562}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0498845222345203, "res": {"No": 0.9501153753736462, "Yes": 0.0498845222345203}, "ground_truth": 1}, {"key": "32799471", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.4388030235973871, "res": {"No": 0.5611969306674436, "Yes": 0.4388030235973871}, "ground_truth": 0}, {"key": "32799471", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.47891054148733553, "res": {"No": 0.521089404616315, "Yes": 0.47891054148733553}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00043019429607221704, "res": {"No": 0.9995696618220472, "Yes": 0.00043019429607221704}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 6.249495521636308e-08}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 7.499007991186983e-08}, "ground_truth": 1}, {"key": "34797243", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 2.6924693431109392e-08}, "ground_truth": 0}, {"key": "34797243", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999965878943212, "res": {"Yes": 0.9999965878943212, "No": 3.3790261881358203e-06}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 4.492963314275522e-05, "res": {"No": 0.9999549868231234, "Yes": 4.492963314275522e-05}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999955150656573, "res": {"Yes": 0.9999955150656573, "No": 4.368711253572066e-06}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998850198707218, "res": {"Yes": 0.9998850198707218, "No": 0.00011491865818504161}, "ground_truth": 1}, {"key": "32154876", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999822836059372, "res": {"Yes": 0.9999822836059372, "No": 1.758664061702107e-05}, "ground_truth": 0}, {"key": "32154876", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999970647075079, "res": {"Yes": 0.9999970647075079, "No": 2.863525499903179e-06}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9287566154635294, "res": {"Yes": 0.9287566154635294, "No": 0.07124334982349725}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 6.679363181933748e-07}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999894357248024, "res": {"Yes": 0.9999894357248024, "No": 1.0470906040567418e-05}, "ground_truth": 1}, {"key": "37962274", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994536690931081, "res": {"Yes": 0.9994536690931081, "No": 0.0005462691800233496}, "ground_truth": 0}, {"key": "37962274", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999877668918251, "res": {"Yes": 0.9999877668918251, "No": 1.211732877156652e-05}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9957894533130549, "res": {"Yes": 0.9957894533130549, "No": 0.004210486835868024}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 2.156308125017947e-06}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993571110417191, "res": {"Yes": 0.9993571110417191, "No": 0.000642893356830736}, "ground_truth": 1}, {"key": "35574030", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9974339414712527, "res": {"Yes": 0.9974339414712527, "No": 0.0025660015724162663}, "ground_truth": 0}, {"key": "35574030", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999093349203267, "res": {"Yes": 0.9999093349203267, "No": 9.060428955087328e-05}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.011211525133416016, "res": {"No": 0.9887883325044259, "Yes": 0.011211525133416016}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9330135455180897, "res": {"Yes": 0.9330135455180897, "No": 0.06698639767356614}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.25186181375225225, "res": {"No": 0.7481380942995108, "Yes": 0.25186181375225225}, "ground_truth": 1}, {"key": "39105949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9973077678746056, "res": {"Yes": 0.9973077678746056, "No": 0.0026921719359919503}, "ground_truth": 0}, {"key": "39105949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9937639444113443, "res": {"Yes": 0.9937639444113443, "No": 0.006236055673925801}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.38142648373960253, "res": {"No": 0.6185733319439514, "Yes": 0.38142648373960253}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.02426660872879775, "res": {"No": 0.9757332932748458, "Yes": 0.02426660872879775}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.0016817612022725402, "res": {"No": 0.9983182603116513, "Yes": 0.0016817612022725402}, "ground_truth": 1}, {"key": "41064322", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.010391196725434128, "res": {"No": 0.9896087282153497, "Yes": 0.010391196725434128}, "ground_truth": 0}, {"key": "41064322", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.010961972949744101, "res": {"No": 0.9890379292327665, "Yes": 0.010961972949744101}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.2736607714569666, "res": {"No": 0.7263389861938508, "Yes": 0.2736607714569666}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 7.164324914454101e-09}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999512916842885, "res": {"Yes": 0.9999512916842885, "No": 4.867714207354752e-05}, "ground_truth": 1}, {"key": "28105101", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 4.051866547842932e-07}, "ground_truth": 0}, {"key": "28105101", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999983475621529, "res": {"Yes": 0.999983475621529, "No": 1.6468040413453934e-05}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.1938915687779415, "res": {"No": 0.8061084356328283, "Yes": 0.1938915687779415}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992921064749292, "res": {"Yes": 0.9992921064749292, "No": 0.000707889889266851}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994178273782804, "res": {"Yes": 0.9994178273782804, "No": 0.0005820900483210294}, "ground_truth": 1}, {"key": "36036068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999748931371826, "res": {"Yes": 0.9999748931371826, "No": 2.505440243416616e-05}, "ground_truth": 0}, {"key": "36036068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999843100330889, "res": {"Yes": 0.9999843100330889, "No": 1.5640794889527887e-05}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00012619565978620883, "res": {"No": 0.9998735850310456, "Yes": 0.00012619565978620883}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.1341711708234805, "res": {"No": 0.8658287225033288, "Yes": 0.1341711708234805}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 8.3196795956417e-08}, "ground_truth": 1}, {"key": "37991460", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998564220183052, "res": {"Yes": 0.9998564220183052, "No": 0.0001435490168864347}, "ground_truth": 0}, {"key": "37991460", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.5891079708446677, "res": {"Yes": 0.5891079708446677, "No": 0.4108920052345974}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 9.82135062364546e-07, "res": {"No": 0.9999987335551019, "Yes": 9.82135062364546e-07}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 1.0026851565567237e-06}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997894487690223, "res": {"Yes": 0.9997894487690223, "No": 0.00021046335615905717}, "ground_truth": 1}, {"key": "38437830", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9942892864713506, "res": {"Yes": 0.9942892864713506, "No": 0.005710739808766229}, "ground_truth": 0}, {"key": "38437830", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.2101527146366752, "res": {"No": 0.7898472552499783, "Yes": 0.2101527146366752}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00024979574351240944, "res": {"No": 0.9997501352813897, "Yes": 0.00024979574351240944}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 1.1547299013373589e-05, "res": {"No": 0.9999882437011058, "Yes": 1.1547299013373589e-05}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.996952552423797, "res": {"Yes": 0.996952552423797, "No": 0.003047450315820474}, "ground_truth": 1}, {"key": "36507138", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9935966716471987, "res": {"Yes": 0.9935966716471987, "No": 0.00640327756611234}, "ground_truth": 0}, {"key": "36507138", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.07799608077728534, "res": {"No": 0.9220037243578729, "Yes": 0.07799608077728534}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 3.191852486350142e-05, "res": {"No": 0.9999679795226665, "Yes": 3.191852486350142e-05}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.02971023439819605, "res": {"No": 0.970289681837004, "Yes": 0.02971023439819605}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9976812779986143, "res": {"Yes": 0.9976812779986143, "No": 0.002318675874477119}, "ground_truth": 1}, {"key": "37824866", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.11437934122971141, "res": {"No": 0.8856205670480953, "Yes": 0.11437934122971141}, "ground_truth": 0}, {"key": "37824866", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.4075802227632651, "res": {"No": 0.5924197607725976, "Yes": 0.4075802227632651}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9938430646859923, "res": {"Yes": 0.9938430646859923, "No": 0.006156891225568576}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999757275415809, "res": {"Yes": 0.9999757275415809, "No": 2.421060010105371e-05}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9974261124434852, "res": {"Yes": 0.9974261124434852, "No": 0.002573822837183458}, "ground_truth": 1}, {"key": "25088134", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998636924207224, "res": {"Yes": 0.9998636924207224, "No": 0.00013623748252738425}, "ground_truth": 0}, {"key": "25088134", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999419942923962, "res": {"Yes": 0.9999419942923962, "No": 5.7877607070380105e-05}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998978924633294, "res": {"Yes": 0.9998978924633294, "No": 0.00010208742540263699}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999032311662633, "res": {"Yes": 0.999032311662633, "No": 0.0009676477805210748}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999983759447187, "res": {"Yes": 0.9999983759447187, "No": 1.5919736853204803e-06}, "ground_truth": 1}, {"key": "40172531", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999961110815618, "res": {"Yes": 0.9999961110815618, "No": 3.847649944742166e-06}, "ground_truth": 0}, {"key": "40172531", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9027392201682426, "res": {"Yes": 0.9027392201682426, "No": 0.09726068802030545}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999509340887712, "res": {"Yes": 0.9999509340887712, "No": 4.897424550350835e-05}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9533987588755678, "res": {"Yes": 0.9533987588755678, "No": 0.04660124600049263}, "ground_truth": 1}, {"key": "37035874", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9582312364235591, "res": {"Yes": 0.9582312364235591, "No": 0.04176868428548172}, "ground_truth": 0}, {"key": "37035874", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9909942251151058, "res": {"Yes": 0.9909942251151058, "No": 0.009005696116594413}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999889589149532, "res": {"Yes": 0.9999889589149532, "No": 1.0925074475788974e-05}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9904618217583158, "res": {"Yes": 0.9904618217583158, "No": 0.009538147450093746}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9907895048747424, "res": {"Yes": 0.9907895048747424, "No": 0.00921039722403025}, "ground_truth": 1}, {"key": "36404465", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998895490961502, "res": {"Yes": 0.9998895490961502, "No": 0.00011039408538143107}, "ground_truth": 0}, {"key": "36404465", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.6094360668404151, "res": {"Yes": 0.6094360668404151, "No": 0.3905638830986325}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.025413691874902486, "res": {"No": 0.9745860706999259, "Yes": 0.025413691874902486}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.5698003173321523, "res": {"Yes": 0.5698003173321523, "No": 0.43019972559637537}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999448550185404, "res": {"Yes": 0.9999448550185404, "No": 5.501393726583618e-05}, "ground_truth": 1}, {"key": "39602052", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9852561281824537, "res": {"Yes": 0.9852561281824537, "No": 0.014743790026509043}, "ground_truth": 0}, {"key": "39602052", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8631794949605339, "res": {"Yes": 0.8631794949605339, "No": 0.13682043586122944}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.16761265275814252, "res": {"No": 0.8323872930637056, "Yes": 0.16761265275814252}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.976267481697591, "res": {"Yes": 0.976267481697591, "No": 0.023732472997374326}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999881244990143, "res": {"Yes": 0.9999881244990143, "No": 1.182116487095407e-05}, "ground_truth": 1}, {"key": "33792789", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990960937396086, "res": {"Yes": 0.9990960937396086, "No": 0.0009038230119330883}, "ground_truth": 0}, {"key": "33792789", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.6170692035630472, "res": {"Yes": 0.6170692035630472, "No": 0.3829307176611009}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9314795062385132, "res": {"Yes": 0.9314795062385132, "No": 0.06852045261215131}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9390055023437891, "res": {"Yes": 0.9390055023437891, "No": 0.06099440136027841}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5072102332989786, "res": {"Yes": 0.5072102332989786, "No": 0.4927897531992536}, "ground_truth": 1}, {"key": "32776626", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997258277620793, "res": {"Yes": 0.9997258277620793, "No": 0.00027411961383280416}, "ground_truth": 0}, {"key": "32776626", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9673803335318186, "res": {"Yes": 0.9673803335318186, "No": 0.0326195818726458}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9242867684734586, "res": {"Yes": 0.9242867684734586, "No": 0.07571308349388474}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998853774396677, "res": {"Yes": 0.9998853774396677, "No": 0.00011451748948965702}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999976607241361, "res": {"Yes": 0.9999976607241361, "No": 2.2799478227923083e-06}, "ground_truth": 1}, {"key": "37195090", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999841908319662, "res": {"Yes": 0.9999841908319662, "No": 1.572332939206357e-05}, "ground_truth": 0}, {"key": "37195090", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999947998470209, "res": {"Yes": 0.9999947998470209, "No": 5.097634241870131e-06}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.13197828203106657, "res": {"No": 0.868021582499627, "Yes": 0.13197828203106657}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999531988512079, "res": {"Yes": 0.9999531988512079, "No": 4.672164548141408e-05}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.05014714978439312, "res": {"No": 0.9498527627292541, "Yes": 0.05014714978439312}, "ground_truth": 1}, {"key": "33981824", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7474661193715257, "res": {"Yes": 0.7474661193715257, "No": 0.2525337691502758}, "ground_truth": 0}, {"key": "33981824", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9963032106131338, "res": {"Yes": 0.9963032106131338, "No": 0.0036968136723007803}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.7692880824946291, "res": {"Yes": 0.7692880824946291, "No": 0.23071181532677168}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.7428182653078305, "res": {"Yes": 0.7428182653078305, "No": 0.25718158169782895}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.16624295105736694, "res": {"No": 0.8337569049395755, "Yes": 0.16624295105736694}, "ground_truth": 1}, {"key": "39569142", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8034683698845546, "res": {"Yes": 0.8034683698845546, "No": 0.1965314322313985}, "ground_truth": 0}, {"key": "39569142", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.013018970708153624, "res": {"No": 0.9869809091851551, "Yes": 0.013018970708153624}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 6.100914335170698e-07, "res": {"No": 0.9999992103693117, "Yes": 6.100914335170698e-07}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997475134600927, "res": {"Yes": 0.9997475134600927, "No": 0.0002523647743081471}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999959918780326, "res": {"Yes": 0.9999959918780326, "No": 3.971149335499921e-06}, "ground_truth": 1}, {"key": "40268210", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999675027220479, "res": {"Yes": 0.9999675027220479, "No": 3.237027482331218e-05}, "ground_truth": 0}, {"key": "40268210", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.622181620737242e-07}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.00036481470165017723, "res": {"No": 0.9996351647685646, "Yes": 0.00036481470165017723}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997887336898705, "res": {"Yes": 0.9997887336898705, "No": 0.00021122154479394576}, "ground_truth": 1}, {"key": "34925159", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994522394456187, "res": {"Yes": 0.9994522394456187, "No": 0.0005477623680545662}, "ground_truth": 0}, {"key": "34925159", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.026499630221313904, "res": {"No": 0.9735002805334212, "Yes": 0.026499630221313904}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998695326316075, "res": {"Yes": 0.9998695326316075, "No": 0.00013040429133532284}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999723899261651, "res": {"Yes": 0.9999723899261651, "No": 2.756080233340519e-05}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999588011756949, "res": {"Yes": 0.9999588011756949, "No": 4.1095332803608414e-05}, "ground_truth": 1}, {"key": "36181903", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.00032098312702526623, "res": {"No": 0.9996788901668019, "Yes": 0.00032098312702526623}, "ground_truth": 0}, {"key": "36181903", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.004599205535854297, "res": {"No": 0.9954008130009299, "Yes": 0.004599205535854297}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8561036103813809, "res": {"Yes": 0.8561036103813809, "No": 0.14389629679393154}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.000837212614515976, "res": {"No": 0.9991626083382539, "Yes": 0.000837212614515976}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.992522738853113, "res": {"Yes": 0.992522738853113, "No": 0.007477184212851723}, "ground_truth": 1}, {"key": "38620559", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9989802145349808, "res": {"Yes": 0.9989802145349808, "No": 0.0010197858751980332}, "ground_truth": 0}, {"key": "38620559", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9245165747278349, "res": {"Yes": 0.9245165747278349, "No": 0.07548328786581203}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9937336865486631, "res": {"Yes": 0.9937336865486631, "No": 0.006266244920495596}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.04963111119750722, "res": {"No": 0.9503688657611941, "Yes": 0.04963111119750722}, "ground_truth": 1}, {"key": "32719657", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.035446838922786855, "res": {"No": 0.9645531190204516, "Yes": 0.035446838922786855}, "ground_truth": 0}, {"key": "32719657", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 1.331792081508109e-05, "res": {"No": 0.9999865748701179, "Yes": 1.331792081508109e-05}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 3.323446892458785e-05, "res": {"No": 0.9999666683255126, "Yes": 3.323446892458785e-05}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998088750666976, "res": {"Yes": 0.9998088750666976, "No": 0.00019109707747616645}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9985655595945422, "res": {"Yes": 0.9985655595945422, "No": 0.0014343822647194973}, "ground_truth": 1}, {"key": "37530914", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999233997739472, "res": {"Yes": 0.9999233997739472, "No": 7.656082768082061e-05}, "ground_truth": 0}, {"key": "37530914", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.5622713030118031, "res": {"Yes": 0.5622713030118031, "No": 0.43772864174259324}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0029455862955850543, "res": {"No": 0.9970542229408715, "Yes": 0.0029455862955850543}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9515846266011354, "res": {"Yes": 0.9515846266011354, "No": 0.048415270927159124}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9915058657534479, "res": {"Yes": 0.9915058657534479, "No": 0.008494095533328676}, "ground_truth": 1}, {"key": "33306933", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7716842848897035, "res": {"Yes": 0.7716842848897035, "No": 0.2283157590532918}, "ground_truth": 0}, {"key": "33306933", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8632651266136938, "res": {"Yes": 0.8632651266136938, "No": 0.1367348677650459}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.1410934381708774e-07}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.00952738114723924, "res": {"No": 0.9904725782321075, "Yes": 0.00952738114723924}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999982567412194, "res": {"Yes": 0.9999982567412194, "No": 1.6204235374821546e-06}, "ground_truth": 1}, {"key": "33837212", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, " Yes": 5.402121987050817e-09}, "ground_truth": 0}, {"key": "33837212", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.0001641000098243767, "res": {"No": 0.9998358066312069, "Yes": 0.0001641000098243767}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.006205044429979208, "res": {"No": 0.9937949066031229, "Yes": 0.006205044429979208}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999913429644723, "res": {"Yes": 0.9999913429644723, "No": 8.57894167478106e-06}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.975867695155704, "res": {"Yes": 0.975867695155704, "No": 0.024132207980212424}, "ground_truth": 1}, {"key": "40945179", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999837140256179, "res": {"Yes": 0.9999837140256179, "No": 1.6189802325754663e-05}, "ground_truth": 0}, {"key": "40945179", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9858734100451604, "res": {"Yes": 0.9858734100451604, "No": 0.014126549625035444}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0031697524044344803, "res": {"No": 0.9968302933607792, "Yes": 0.0031697524044344803}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999442590335854, "res": {"Yes": 0.9999442590335854, "No": 5.568682355319115e-05}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999975415208221, "res": {"Yes": 0.9999975415208221, "No": 2.352723416916157e-06}, "ground_truth": 1}, {"key": "34152358", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.519055574664646e-07}, "ground_truth": 0}, {"key": "34152358", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999950382530095, "res": {"Yes": 0.9999950382530095, "No": 4.883252813540625e-06}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0019771695049531925, "res": {"No": 0.9980227660075927, "Yes": 0.0019771695049531925}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.7699226297708661, "res": {"Yes": 0.7699226297708661, "No": 0.2300773781266695}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999994561441089, "res": {"Yes": 0.999994561441089, "No": 5.357822046853879e-06}, "ground_truth": 1}, {"key": "34136541", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999978991308068, "res": {"Yes": 0.9999978991308068, "No": 2.0836924952976174e-06}, "ground_truth": 0}, {"key": "34136541", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8602072761464505, "res": {"Yes": 0.8602072761464505, "No": 0.13979270950580758}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9996356414147175, "res": {"Yes": 0.9996356414147175, "No": 0.00036429885389569893}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9743707587205932, "res": {"Yes": 0.9743707587205932, "No": 0.025629152650483166}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999868132749457, "res": {"Yes": 0.9999868132749457, "No": 1.3110344275593768e-05}, "ground_truth": 1}, {"key": "37469603", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.4473720864572844e-06}, "ground_truth": 0}, {"key": "37469603", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9390920169059521, "res": {"Yes": 0.9390920169059521, "No": 0.060907936046855946}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.6938181253777299, "res": {"Yes": 0.6938181253777299, "No": 0.3061816578706603}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9829743812256179, "res": {"Yes": 0.9829743812256179, "No": 0.017025449924710247}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998905026252752, "res": {"Yes": 0.9998905026252752, "No": 0.00010930471779386452}, "ground_truth": 1}, {"key": "37353611", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9982973490575597, "res": {"Yes": 0.9982973490575597, "No": 0.0017025298279601745}, "ground_truth": 0}, {"key": "37353611", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.6725273629045415, "res": {"Yes": 0.6725273629045415, "No": 0.32747243348972377}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.1818771354171651, "res": {"No": 0.8181228502304658, "Yes": 0.1818771354171651}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999757275415809, "res": {"Yes": 0.9999757275415809, "No": 2.4188723608226926e-05}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999783255162557, "res": {"Yes": 0.999783255162557, "No": 0.00021652176162157213}, "ground_truth": 1}, {"key": "37211649", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999976607241361, "res": {"Yes": 0.9999976607241361, "No": 2.2929347744526504e-06}, "ground_truth": 0}, {"key": "37211649", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999810662776555, "res": {"Yes": 0.999810662776555, "No": 0.00018928343692713225}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9879366141608267, "res": {"Yes": 0.9879366141608267, "No": 0.012063273379615526}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.3769758079911635e-07}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 1.8555824777685878e-07}, "ground_truth": 1}, {"key": "37320976", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9985219451006797, "res": {"Yes": 0.9985219451006797, "No": 0.0014780160459292569}, "ground_truth": 0}, {"key": "37320976", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 8.480562193014596e-08}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.3266799282911547, "res": {"No": 0.6733200198166537, "Yes": 0.3266799282911547}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996507711745873, "res": {"Yes": 0.9996507711745873, "No": 0.00034911663286540516}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.2588891503043055, "res": {"No": 0.7411108053351678, "Yes": 0.2588891503043055}, "ground_truth": 1}, {"key": "34492412", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999870516788303, "res": {"Yes": 0.9999870516788303, "No": 1.2908119835518259e-05}, "ground_truth": 0}, {"key": "34492412", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.045600787175052206, "res": {"No": 0.9543989522587574, "Yes": 0.045600787175052206}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9976514973576445, "res": {"Yes": 0.9976514973576445, "No": 0.002348497774790785}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990620622388586, "res": {"Yes": 0.9990620622388586, "No": 0.0009379433549130952}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999499805090164, "res": {"Yes": 0.9999499805090164, "No": 4.994051304188083e-05}, "ground_truth": 1}, {"key": "36655016", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998914561513098, "res": {"Yes": 0.9998914561513098, "No": 0.00010847693372294325}, "ground_truth": 0}, {"key": "36655016", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.2651261310514567, "res": {"No": 0.7348737964665958, "Yes": 0.2651261310514567}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0014954405997615829, "res": {"No": 0.9985044703207346, "Yes": 0.0014954405997615829}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.8952363923961607, "res": {"Yes": 0.8952363923961607, "No": 0.10476354716478546}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999917005724405, "res": {"Yes": 0.9999917005724405, "No": 8.248402605012572e-06}, "ground_truth": 1}, {"key": "35220773", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999921773835968, "res": {"Yes": 0.9999921773835968, "No": 7.722194288908014e-06}, "ground_truth": 0}, {"key": "35220773", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999967070975216, "res": {"Yes": 0.9999967070975216, "No": 3.238455627424449e-06}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.7605672823446606, "res": {"Yes": 0.7605672823446606, "No": 0.23943270088765703}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995028525187819, "res": {"Yes": 0.9995028525187819, "No": 0.0004970610511876585}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.1458266487567064, "res": {"No": 0.8541732388241776, "Yes": 0.1458266487567064}, "ground_truth": 1}, {"key": "31569808", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9125211095861787, "res": {"Yes": 0.9125211095861787, "No": 0.08747882630389757}, "ground_truth": 0}, {"key": "31569808", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.7874055043172853, "res": {"Yes": 0.7874055043172853, "No": 0.21259451777027916}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00851951384683111, "res": {"No": 0.9914803179509516, "Yes": 0.00851951384683111}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9961048174809756, "res": {"Yes": 0.9961048174809756, "No": 0.0038951328204380156}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9902669150801469, "res": {"Yes": 0.9902669150801469, "No": 0.009732966961755287}, "ground_truth": 1}, {"key": "37696256", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9831017878763877, "res": {"Yes": 0.9831017878763877, "No": 0.016898236696193305}, "ground_truth": 0}, {"key": "37696256", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9678187344887879, "res": {"Yes": 0.9678187344887879, "No": 0.03218115648688847}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997790839555438, "res": {"Yes": 0.9997790839555438, "No": 0.00022084090556697203}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999649995325307, "res": {"Yes": 0.9999649995325307, "No": 3.487382535385065e-05}, "ground_truth": 1}, {"key": "36874328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991920054035751, "res": {"Yes": 0.9991920054035751, "No": 0.000807993939572817}, "ground_truth": 0}, {"key": "36874328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.0036361396347780227, "res": {"No": 0.9963636740047618, "Yes": 0.0036361396347780227}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999974223173222, "res": {"Yes": 0.9999974223173222, "No": 2.549360537116927e-06}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 1.4253804263516357e-08}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.45466742791606e-07}, "ground_truth": 1}, {"key": "24532377", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 6.941026338374637e-07}, "ground_truth": 0}, {"key": "24532377", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999968263007362, "res": {"Yes": 0.9999968263007362, "No": 3.073308159959428e-06}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999981375378344, "res": {"Yes": 0.9999981375378344, "No": 1.842481967325023e-06}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9961696220843091, "res": {"Yes": 0.9961696220843091, "No": 0.003830345388846723}, "ground_truth": 1}, {"key": "39560618", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 9.009376217182706e-09}, "ground_truth": 0}, {"key": "39560618", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8861551330218943, "res": {"Yes": 0.8861551330218943, "No": 0.11384486394073516}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 5.306025480792926e-06, "res": {"No": 0.999994561441089, "Yes": 5.306025480792926e-06}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.652777048120313e-07}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999785883642324, "res": {"Yes": 0.9999785883642324, "No": 2.1311451513035435e-05}, "ground_truth": 1}, {"key": "34922693", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999882437011058, "res": {"Yes": 0.9999882437011058, "No": 1.1693879180681173e-05}, "ground_truth": 0}, {"key": "34922693", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 3.312326272675888e-08}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.7719093176814601, "res": {"Yes": 0.7719093176814601, "No": 0.2280906594259494}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.997050902556427, "res": {"Yes": 0.997050902556427, "No": 0.002949151727443485}, "ground_truth": 1}, {"key": "33629577", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999915813694369, "res": {"Yes": 0.9999915813694369, "No": 8.297917319584673e-06}, "ground_truth": 0}, {"key": "33629577", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9738312022530945, "res": {"Yes": 0.9738312022530945, "No": 0.026168732419756452}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0471711217954661, "res": {"No": 0.9528288092401643, "Yes": 0.0471711217954661}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990722932562269, "res": {"Yes": 0.9990722932562269, "No": 0.0009276874328162157}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999981375378344, "res": {"Yes": 0.9999981375378344, "No": 1.766140324486626e-06}, "ground_truth": 1}, {"key": "32284359", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999944422379444, "res": {"Yes": 0.9999944422379444, "No": 5.51244111133164e-06}, "ground_truth": 0}, {"key": "32284359", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9973266153743557, "res": {"Yes": 0.9973266153743557, "No": 0.0026734230138675337}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.999995276659155, "res": {"Yes": 0.999995276659155, "No": 4.589910651433089e-06}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9986957330963703, "res": {"Yes": 0.9986957330963703, "No": 0.0013041935481453038}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999413983091462, "res": {"Yes": 0.9999413983091462, "No": 5.849577667045426e-05}, "ground_truth": 1}, {"key": "28082962", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 2.2552452919399506e-08}, "ground_truth": 0}, {"key": "28082962", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.6096487949493315e-07}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.366106208689808, "res": {"No": 0.6338937407070723, "Yes": 0.366106208689808}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9163794897338499, "res": {"Yes": 0.9163794897338499, "No": 0.08362048107173571}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999988527586581, "res": {"Yes": 0.9999988527586581, "No": 1.021927508209872e-06}, "ground_truth": 1}, {"key": "24796803", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999595163694843, "res": {"Yes": 0.9999595163694843, "No": 4.0448985302625035e-05}, "ground_truth": 0}, {"key": "24796803", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.982450006993995, "res": {"Yes": 0.982450006993995, "No": 0.017550023325198602}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.001710849924629427, "res": {"No": 0.9982891599581637, "Yes": 0.001710849924629427}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997037887092296, "res": {"Yes": 0.9997037887092296, "No": 0.00029616257930986385}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9800632260706406, "res": {"Yes": 0.9800632260706406, "No": 0.019936640681108286}, "ground_truth": 1}, {"key": "35466150", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999835948245663, "res": {"Yes": 0.9999835948245663, "No": 1.6382645248425573e-05}, "ground_truth": 0}, {"key": "35466150", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9903468724587063, "res": {"Yes": 0.9903468724587063, "No": 0.009653072698133204}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999398487531588, "res": {"Yes": 0.9999398487531588, "No": 6.01316639952702e-05}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999988527586581, "res": {"Yes": 0.9999988527586581, "No": 1.1240852097275627e-06}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.779698457044157e-07}, "ground_truth": 1}, {"key": "35754289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 4.069872792094284e-08}, "ground_truth": 0}, {"key": "35754289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999804955832136, "res": {"Yes": 0.9999804955832136, "No": 1.9449620493353973e-05}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9688070206703034, "res": {"Yes": 0.9688070206703034, "No": 0.031192780661367905}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9778249624160267, "res": {"Yes": 0.9778249624160267, "No": 0.022174735027773607}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8342226298332743, "res": {"Yes": 0.8342226298332743, "No": 0.16577709403780316}, "ground_truth": 1}, {"key": "36678662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8377758385895014, "res": {"Yes": 0.8377758385895014, "No": 0.16222388364843257}, "ground_truth": 0}, {"key": "36678662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.30101114149040725, "res": {"No": 0.6989886740188396, "Yes": 0.30101114149040725}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9978147764849105, "res": {"Yes": 0.9978147764849105, "No": 0.0021852100987999486}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.3331149677792288, "res": {"No": 0.6668849744746993, "Yes": 0.3331149677792288}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998313150632376, "res": {"Yes": 0.998313150632376, "No": 0.0016868024224015044}, "ground_truth": 1}, {"key": "35399671", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9136589931300205, "res": {"Yes": 0.9136589931300205, "No": 0.08634091424656432}, "ground_truth": 0}, {"key": "35399671", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.20856275496166873, "res": {"No": 0.7914371966985017, "Yes": 0.20856275496166873}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999778731568022, "res": {"Yes": 0.9999778731568022, "No": 2.2009178215335974e-05}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9904990147932579, "res": {"Yes": 0.9904990147932579, "No": 0.00950088810507815}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9970555265901202, "res": {"Yes": 0.9970555265901202, "No": 0.0029444889745749176}, "ground_truth": 1}, {"key": "36888180", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988672138871328, "res": {"Yes": 0.9988672138871328, "No": 0.001132722785347812}, "ground_truth": 0}, {"key": "36888180", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998768031293578, "res": {"Yes": 0.9998768031293578, "No": 0.0001230848011380237}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0007020743133979144, "res": {"No": 0.9992977050546176, "Yes": 0.0007020743133979144}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9434086181228697, "res": {"Yes": 0.9434086181228697, "No": 0.056591300896122125}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9981030341184178, "res": {"Yes": 0.9981030341184178, "No": 0.0018969631758489214}, "ground_truth": 1}, {"key": "28061069", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997720525239746, "res": {"Yes": 0.9997720525239746, "No": 0.00022792521208278587}, "ground_truth": 0}, {"key": "28061069", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9910802768795559, "res": {"Yes": 0.9910802768795559, "No": 0.008919666687148348}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.999932220207154, "res": {"Yes": 0.999932220207154, "No": 6.764703722133716e-05}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991523763760293, "res": {"Yes": 0.9991523763760293, "No": 0.0008475997724788732}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999182744197171, "res": {"Yes": 0.9999182744197171, "No": 8.159863696451186e-05}, "ground_truth": 1}, {"key": "22259982", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999937345628867, "res": {"Yes": 0.999937345628867, "No": 6.26067786861156e-05}, "ground_truth": 0}, {"key": "22259982", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999983759447187, "res": {"Yes": 0.9999983759447187, "No": 1.4996017276671424e-06}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998941975374753, "res": {"Yes": 0.9998941975374753, "No": 0.0001056966879517019}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998944359222794, "res": {"Yes": 0.9998944359222794, "No": 0.00010545544674277793}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991097789320968, "res": {"Yes": 0.9991097789320968, "No": 0.0008902266186086841}, "ground_truth": 1}, {"key": "34026805", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999974223173222, "res": {"Yes": 0.9999974223173222, "No": 2.4549233971373113e-06}, "ground_truth": 0}, {"key": "34026805", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.6633291211347406, "res": {"Yes": 0.6633291211347406, "No": 0.33667089449090976}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9996961619681268, "res": {"Yes": 0.9996961619681268, "No": 0.00030374956360557906}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998938399653753, "res": {"Yes": 0.9998938399653753, "No": 0.00010611161989598356}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999055207534452, "res": {"Yes": 0.9999055207534452, "No": 9.439419314493679e-05}, "ground_truth": 1}, {"key": "36713809", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991138282123433, "res": {"Yes": 0.9991138282123433, "No": 0.0008861375243923678}, "ground_truth": 0}, {"key": "36713809", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999112420092235, "res": {"Yes": 0.9999112420092235, "No": 8.868480421093794e-05}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9987816951366845, "res": {"Yes": 0.9987816951366845, "No": 0.0012182672703275957}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9511553018846574, "res": {"Yes": 0.9511553018846574, "No": 0.04884466101087967}, "ground_truth": 1}, {"key": "39726411", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 5.133427942600308e-07}, "ground_truth": 0}, {"key": "39726411", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 3.4797434087991576e-06, "res": {"No": 0.9999963494876631, "Yes": 3.4797434087991576e-06}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.001066700542238775, "res": {"No": 0.998932987762818, "Yes": 0.001066700542238775}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997628759583507, "res": {"Yes": 0.9997628759583507, "No": 0.0002370259332072456}, "ground_truth": 0}, {"key": "37069841", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999200623291858, "res": {"Yes": 0.9999200623291858, "No": 7.981153620375848e-05}, "ground_truth": 1}, {"key": "37069841", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998062530813588, "res": {"Yes": 0.9998062530813588, "No": 0.0001937271174867023}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9625387845458433, "res": {"Yes": 0.9625387845458433, "No": 0.037461183079135534}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 4.363993816161813e-07}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 8.787934876152156e-08}, "ground_truth": 1}, {"key": "38894693", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.7201653011918064e-07}, "ground_truth": 0}, {"key": "38894693", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9961346162030787, "res": {"Yes": 0.9961346162030787, "No": 0.0038653347116760304}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9771061421010151, "res": {"Yes": 0.9771061421010151, "No": 0.02289376216659248}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 7.194872726029328e-07}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999603507610518, "res": {"Yes": 0.9999603507610518, "No": 3.956047674873093e-05}, "ground_truth": 1}, {"key": "33946032", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.99814792441259, "res": {"Yes": 0.99814792441259, "No": 0.00185205026907031}, "ground_truth": 0}, {"key": "33946032", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9861709165941088, "res": {"Yes": 0.9861709165941088, "No": 0.013829033777368433}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9826748899908496, "res": {"Yes": 0.9826748899908496, "No": 0.017325064690045168}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999374648254056, "res": {"Yes": 0.9999374648254056, "No": 6.248750132627134e-05}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6734198469090918, "res": {"Yes": 0.6734198469090918, "No": 0.32658004484204106}, "ground_truth": 1}, {"key": "39035311", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9956433657845736, "res": {"Yes": 0.9956433657845736, "No": 0.004356581451161574}, "ground_truth": 0}, {"key": "39035311", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.5327308256088813, "res": {"Yes": 0.5327308256088813, "No": 0.46726901869861376}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9740665209582489, "res": {"Yes": 0.9740665209582489, "No": 0.02593344838593757}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998433152563369, "res": {"Yes": 0.9998433152563369, "No": 0.00015658649765435805}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9894052746919906, "res": {"Yes": 0.9894052746919906, "No": 0.01059461421406337}, "ground_truth": 1}, {"key": "27680038", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995279703410699, "res": {"Yes": 0.9995279703410699, "No": 0.00047191248627673666}, "ground_truth": 0}, {"key": "27680038", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.966187339830845, "res": {"Yes": 0.966187339830845, "No": 0.03381261233800607}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.389521659366683e-06, "res": {"No": 0.9999984951481323, "Yes": 1.389521659366683e-06}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995283277923265, "res": {"Yes": 0.9995283277923265, "No": 0.0004715797165905838}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9539003766293411, "res": {"Yes": 0.9539003766293411, "No": 0.04609960948761054}, "ground_truth": 1}, {"key": "36901907", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999908661547138, "res": {"Yes": 0.9999908661547138, "No": 9.082409837117232e-06}, "ground_truth": 0}, {"key": "36901907", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999970647075079, "res": {"Yes": 0.9999970647075079, "No": 2.9159963369751894e-06}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9951119927796586, "res": {"Yes": 0.9951119927796586, "No": 0.004887989036779872}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998639308082523, "res": {"Yes": 0.9998639308082523, "No": 0.0001359556266635581}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999309090568892, "res": {"Yes": 0.9999309090568892, "No": 6.906151008263735e-05}, "ground_truth": 1}, {"key": "21530542", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999684563215123, "res": {"Yes": 0.9999684563215123, "No": 3.1502930018441156e-05}, "ground_truth": 0}, {"key": "21530542", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993900804366019, "res": {"Yes": 0.9993900804366019, "No": 0.0006098545938191671}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9535672755566259, "res": {"Yes": 0.9535672755566259, "No": 0.04643273838055261}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9334520949430661, "res": {"Yes": 0.9334520949430661, "No": 0.066547859396512}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9769020049166307, "res": {"Yes": 0.9769020049166307, "No": 0.023097913273853715}, "ground_truth": 1}, {"key": "38192532", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8958422605489833, "res": {"Yes": 0.8958422605489833, "No": 0.10415761481766864}, "ground_truth": 0}, {"key": "38192532", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9938394062570204, "res": {"Yes": 0.9938394062570204, "No": 0.00616057969212463}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9680882388724829, "res": {"Yes": 0.9680882388724829, "No": 0.031911724421253555}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995296383847244, "res": {"Yes": 0.9995296383847244, "No": 0.0004702418599409724}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7605893391156703, "res": {"Yes": 0.7605893391156703, "No": 0.23941041074082683}, "ground_truth": 1}, {"key": "34102400", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997767004150644, "res": {"Yes": 0.9997767004150644, "No": 0.00022324270837394068}, "ground_truth": 0}, {"key": "34102400", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999086331589397, "res": {"Yes": 0.999086331589397, "No": 0.0009136728342386257}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.15961356561353152, "res": {"No": 0.840386410851358, "Yes": 0.15961356561353152}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9982987732295737, "res": {"Yes": 0.9982987732295737, "No": 0.0017011496360131808}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999820452021894, "res": {"Yes": 0.9999820452021894, "No": 1.7926939078628326e-05}, "ground_truth": 1}, {"key": "36133399", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996922331199457, "res": {"Yes": 0.9996922331199457, "No": 0.00030775578356923087}, "ground_truth": 0}, {"key": "36133399", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.07745412138828955, "res": {"No": 0.9225458060919242, "Yes": 0.07745412138828955}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0033928249025780397, "res": {"No": 0.9966069327074075, "Yes": 0.0033928249025780397}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9982703911004486, "res": {"Yes": 0.9982703911004486, "No": 0.0017295783992976948}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8036599717245334, "res": {"Yes": 0.8036599717245334, "No": 0.19633998600444583}, "ground_truth": 1}, {"key": "34314544", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996934248037825, "res": {"Yes": 0.9996934248037825, "No": 0.0003065388674574195}, "ground_truth": 0}, {"key": "34314544", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9982944930327592, "res": {"Yes": 0.9982944930327592, "No": 0.001705495661393574}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 2.622281021675538e-06, "res": {"No": 0.9999971839107652, "Yes": 2.622281021675538e-06}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999073086401096, "res": {"Yes": 0.9999073086401096, "No": 9.258485338940715e-05}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9989774793308979, "res": {"Yes": 0.9989774793308979, "No": 0.0010225415859690281}, "ground_truth": 1}, {"key": "33460074", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9982514998106651, "res": {"Yes": 0.9982514998106651, "No": 0.0017485115426923844}, "ground_truth": 0}, {"key": "33460074", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9967818443992558, "res": {"Yes": 0.9967818443992558, "No": 0.0032181005010349763}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.13055751778636965, "res": {"No": 0.8694423672659001, "Yes": 0.13055751778636965}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.6847228644696534, "res": {"Yes": 0.6847228644696534, "No": 0.3152771139701634}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7696358870004331, "res": {"Yes": 0.7696358870004331, "No": 0.23036400284930414}, "ground_truth": 1}, {"key": "36191495", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.11528511016335058, "res": {"No": 0.8847148316710997, "Yes": 0.11528511016335058}, "ground_truth": 0}, {"key": "36191495", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9617800718437363, "res": {"Yes": 0.9617800718437363, "No": 0.03821989834143298}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8525798146364144, "res": {"Yes": 0.8525798146364144, "No": 0.14741988548728346}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.99930281990306, "res": {"Yes": 0.99930281990306, "No": 0.0006971803004171083}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999936078174301, "res": {"Yes": 0.9999936078174301, "No": 6.275904122867088e-06}, "ground_truth": 1}, {"key": "39532668", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999981375378344, "res": {"Yes": 0.9999981375378344, "No": 1.8132314010514023e-06}, "ground_truth": 0}, {"key": "39532668", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997986255585553, "res": {"Yes": 0.9997986255585553, "No": 0.0002013060844485716}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 5.288277883287546e-07, "res": {"No": 0.9999994487765019, "Yes": 5.288277883287546e-07}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9922705609417645, "res": {"Yes": 0.9922705609417645, "No": 0.007729364746743159}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.282190125030222e-07}, "ground_truth": 1}, {"key": "20328247", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8470393646722963, "res": {"Yes": 0.8470393646722963, "No": 0.15296058578882854}, "ground_truth": 0}, {"key": "20328247", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998118545815696, "res": {"Yes": 0.9998118545815696, "No": 0.00018806385472701687}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9839799117760575, "res": {"Yes": 0.9839799117760575, "No": 0.016020122350684833}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.3372000450148802e-07}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 2.516245083203239e-08}, "ground_truth": 1}, {"key": "39112675", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 4.179646794121244e-08}, "ground_truth": 0}, {"key": "39112675", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.984908992972359, "res": {"Yes": 0.984908992972359, "No": 0.015090935702603295}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9135822764053642, "res": {"Yes": 0.9135822764053642, "No": 0.08641768816442168}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999684563215123, "res": {"Yes": 0.9999684563215123, "No": 3.148841051470542e-05}, "ground_truth": 1}, {"key": "31620300", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986254733283209, "res": {"Yes": 0.9986254733283209, "No": 0.0013745553252318323}, "ground_truth": 0}, {"key": "31620300", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.00020294957678461875, "res": {"No": 0.9997968378602231, "Yes": 0.00020294957678461875}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.816587538858012, "res": {"Yes": 0.816587538858012, "No": 0.1834124201144374}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9988133322476874, "res": {"Yes": 0.9988133322476874, "No": 0.0011866162614436288}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996479149564914, "res": {"Yes": 0.9996479149564914, "No": 0.0003519705678234359}, "ground_truth": 1}, {"key": "37518509", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999620195462757, "res": {"Yes": 0.9999620195462757, "No": 3.7876374665299275e-05}, "ground_truth": 0}, {"key": "37518509", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.5224163310120646, "res": {"Yes": 0.5224163310120646, "No": 0.47758365532891267}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999964686909351, "res": {"Yes": 0.9999964686909351, "No": 3.4796181402912885e-06}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999057591369491, "res": {"Yes": 0.9999057591369491, "No": 9.412338782614371e-05}, "ground_truth": 1}, {"key": "35454095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9742013625265175, "res": {"Yes": 0.9742013625265175, "No": 0.025798394955935555}, "ground_truth": 0}, {"key": "35454095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9679661386992416, "res": {"Yes": 0.9679661386992416, "No": 0.03203380588210923}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9994605754817469, "res": {"Yes": 0.9994605754817469, "No": 0.0005394081704931928}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998101860569464, "res": {"Yes": 0.9998101860569464, "No": 0.00018975552971597158}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990608712976465, "res": {"Yes": 0.9990608712976465, "No": 0.0009390739761657317}, "ground_truth": 1}, {"key": "38542788", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.993277015662335, "res": {"Yes": 0.993277015662335, "No": 0.0067228406365033066}, "ground_truth": 0}, {"key": "38542788", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9930380826148416, "res": {"Yes": 0.9930380826148416, "No": 0.00696177366622482}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.8911640859511444e-06, "res": {"No": 0.9999980183344636, "Yes": 1.8911640859511444e-06}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999589203757908, "res": {"Yes": 0.9999589203757908, "No": 4.1039891535599575e-05}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999902701413353, "res": {"Yes": 0.9999902701413353, "No": 9.636322553265875e-06}, "ground_truth": 1}, {"key": "23944937", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9979144889065413, "res": {"Yes": 0.9979144889065413, "No": 0.002085454211947185}, "ground_truth": 0}, {"key": "23944937", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9918880617917674, "res": {"Yes": 0.9918880617917674, "No": 0.008111901294865928}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.001023620936599571, "res": {"No": 0.9989762886503498, "Yes": 0.001023620936599571}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.987000881932917, "res": {"Yes": 0.987000881932917, "No": 0.012998985019392395}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998497475990228, "res": {"Yes": 0.9998497475990228, "No": 0.000150149213746829}, "ground_truth": 1}, {"key": "31753944", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999170824878469, "res": {"Yes": 0.9999170824878469, "No": 8.280202834109297e-05}, "ground_truth": 0}, {"key": "31753944", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998953894470656, "res": {"Yes": 0.9998953894470656, "No": 0.000104529210427229}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.14926088470826993, "res": {"No": 0.8507391662791352, "Yes": 0.14926088470826993}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999813299942867, "res": {"Yes": 0.9999813299942867, "No": 1.8650362034972367e-05}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991031131436655, "res": {"Yes": 0.9991031131436655, "No": 0.0008967853699091676}, "ground_truth": 1}, {"key": "35527214", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998050612730233, "res": {"Yes": 0.9998050612730233, "No": 0.00019488615312965893}, "ground_truth": 0}, {"key": "35527214", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8287223015511397, "res": {"Yes": 0.8287223015511397, "No": 0.17127765942352993}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.009420557590012034, "res": {"No": 0.9905791300886627, "Yes": 0.009420557590012034}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.0006996243568719384, "res": {"No": 0.9993001992748232, "Yes": 0.0006996243568719384}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9977426262090467, "res": {"Yes": 0.9977426262090467, "No": 0.0022573825513648943}, "ground_truth": 1}, {"key": "40400404", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997534721429874, "res": {"Yes": 0.9997534721429874, "No": 0.00024646193458409865}, "ground_truth": 0}, {"key": "40400404", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9878635520344143, "res": {"Yes": 0.9878635520344143, "No": 0.012136323270159602}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999129107124922, "res": {"Yes": 0.9999129107124922, "No": 8.695498387023749e-05}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9970941453923705, "res": {"Yes": 0.9970941453923705, "No": 0.0029057826795281213}, "ground_truth": 1}, {"key": "21713119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999552252224203, "res": {"Yes": 0.9999552252224203, "No": 4.472423648678761e-05}, "ground_truth": 0}, {"key": "21713119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993079384451427, "res": {"Yes": 0.9993079384451427, "No": 0.0006920566787448797}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998980116571646, "res": {"Yes": 0.9998980116571646, "No": 0.00010190143860741199}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998561836525626, "res": {"Yes": 0.9998561836525626, "No": 0.00014372597826106253}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999748931371826, "res": {"Yes": 0.9999748931371826, "No": 2.50153230213836e-05}, "ground_truth": 1}, {"key": "28730678", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996569676190656, "res": {"Yes": 0.9996569676190656, "No": 0.00034294927775455715}, "ground_truth": 0}, {"key": "28730678", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999994561441089, "res": {"Yes": 0.999994561441089, "No": 5.4158105643839106e-06}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0009579863773305479, "res": {"No": 0.9990419505826718, "Yes": 0.0009579863773305479}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.952139250836863, "res": {"Yes": 0.952139250836863, "No": 0.047860660305136346}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993508009909248, "res": {"Yes": 0.9993508009909248, "No": 0.0006491735925897352}, "ground_truth": 1}, {"key": "36823733", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999975489140396, "res": {"Yes": 0.999975489140396, "No": 2.4402596924416144e-05}, "ground_truth": 0}, {"key": "36823733", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.0029215195623412144, "res": {"No": 0.9970785185568329, "Yes": 0.0029215195623412144}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9892325979759623, "res": {"Yes": 0.9892325979759623, "No": 0.010767294784560826}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.7631957099488971, "res": {"Yes": 0.7631957099488971, "No": 0.236804304109353}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997976721210466, "res": {"Yes": 0.9997976721210466, "No": 0.00020221016108391425}, "ground_truth": 1}, {"key": "35988862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.04377640961316266, "res": {"No": 0.9562234327236437, "Yes": 0.04377640961316266}, "ground_truth": 0}, {"key": "35988862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.00018212031825455804, "res": {"No": 0.9998176908203386, "Yes": 0.00018212031825455804}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.7350528555808293, "res": {"Yes": 0.7350528555808293, "No": 0.264947019340756}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.0014924871835060743, "res": {"No": 0.9985073194574551, "Yes": 0.0014924871835060743}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9985736391210275, "res": {"Yes": 0.9985736391210275, "No": 0.001426351205709443}, "ground_truth": 1}, {"key": "40499665", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.13607691522309245, "res": {"No": 0.8639225633042328, "Yes": 0.13607691522309245}, "ground_truth": 0}, {"key": "40499665", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.04655380679395794, "res": {"No": 0.953445986652793, "Yes": 0.04655380679395794}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 5.5144369762437e-06, "res": {"No": 0.9999943230348141, "Yes": 5.5144369762437e-06}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.5080558787060891, "res": {"Yes": 0.5080558787060891, "No": 0.49194399513278364}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9977388276105512, "res": {"Yes": 0.9977388276105512, "No": 0.0022611143771296325}, "ground_truth": 1}, {"key": "32829820", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8480577110690073, "res": {"Yes": 0.8480577110690073, "No": 0.15194225980630383}, "ground_truth": 0}, {"key": "32829820", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.6904383315286575, "res": {"Yes": 0.6904383315286575, "No": 0.30956153064793146}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9649426764982906, "res": {"Yes": 0.9649426764982906, "No": 0.03505724788010887}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999889589149532, "res": {"Yes": 0.9999889589149532, "No": 1.1008663546718355e-05}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999951574563252, "res": {"Yes": 0.9999951574563252, "No": 4.717615861824989e-06}, "ground_truth": 1}, {"key": "20583553", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.371045325918286e-07}, "ground_truth": 0}, {"key": "20583553", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999796611748367, "res": {"Yes": 0.9999796611748367, "No": 2.028363813730681e-05}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999874092852638, "res": {"Yes": 0.9999874092852638, "No": 1.2529132816885026e-05}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999759659438225, "res": {"Yes": 0.9999759659438225, "No": 2.3995721844141748e-05}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9980399833462462, "res": {"Yes": 0.9980399833462462, "No": 0.001959947679948159}, "ground_truth": 1}, {"key": "30501550", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998509394606263, "res": {"Yes": 0.9998509394606263, "No": 0.00014894521562484244}, "ground_truth": 0}, {"key": "30501550", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9959254144419615, "res": {"Yes": 0.9959254144419615, "No": 0.00407464113988117}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.23634953243939494, "res": {"No": 0.7636502901608484, "Yes": 0.23634953243939494}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999884821053314, "res": {"Yes": 0.9999884821053314, "No": 1.1412098424508236e-05}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9960336126763106, "res": {"Yes": 0.9960336126763106, "No": 0.003966343664364909}, "ground_truth": 1}, {"key": "38755897", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997283303588818, "res": {"Yes": 0.9997283303588818, "No": 0.00027160031567535905}, "ground_truth": 0}, {"key": "38755897", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999982567412194, "res": {"Yes": 0.9999982567412194, "No": 1.6093728323251164e-06}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.7583043930533451, "res": {"Yes": 0.7583043930533451, "No": 0.2416955506515651}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9982153881168936, "res": {"Yes": 0.9982153881168936, "No": 0.0017845797957622997}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9790757016068217, "res": {"Yes": 0.9790757016068217, "No": 0.020924348460186742}, "ground_truth": 1}, {"key": "35507201", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.997928262017781, "res": {"Yes": 0.997928262017781, "No": 0.002071749209078765}, "ground_truth": 0}, {"key": "35507201", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997334547494989, "res": {"Yes": 0.9997334547494989, "No": 0.0002664814294235655}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9970522097907223, "res": {"Yes": 0.9970522097907223, "No": 0.0029478181277334714}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.979826947592119, "res": {"Yes": 0.979826947592119, "No": 0.02017302022001168}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997216604436437, "res": {"Yes": 0.9997216604436437, "No": 0.0002782387499701819}, "ground_truth": 1}, {"key": "36453511", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998872844828712, "res": {"Yes": 0.9998872844828712, "No": 0.00011264728416357835}, "ground_truth": 0}, {"key": "36453511", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997280920336735, "res": {"Yes": 0.9997280920336735, "No": 0.00027186770191844006}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.02681029294734623, "res": {"No": 0.9731895985648042, "Yes": 0.02681029294734623}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.00955975958736696, "res": {"No": 0.9904401893179047, "Yes": 0.00955975958736696}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.18418612200346768, "res": {"No": 0.8158138051649082, "Yes": 0.18418612200346768}, "ground_truth": 1}, {"key": "38066835", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9754149341771388, "res": {"Yes": 0.9754149341771388, "No": 0.024584847035512655}, "ground_truth": 0}, {"key": "38066835", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.00034804387797602015, "res": {"No": 0.9996517244820033, "Yes": 0.00034804387797602015}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8531232601461672, "res": {"Yes": 0.8531232601461672, "No": 0.14687652663897943}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998820401278129, "res": {"Yes": 0.9998820401278129, "No": 0.00011785458782270268}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.896275644072528e-07}, "ground_truth": 1}, {"key": "39697181", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999690523188893, "res": {"Yes": 0.9999690523188893, "No": 3.090838659637265e-05}, "ground_truth": 0}, {"key": "39697181", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992798445365096, "res": {"Yes": 0.9992798445365096, "No": 0.0007201293567058609}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.06408302312361712, "res": {"No": 0.9359167114101306, "Yes": 0.06408302312361712}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9981293961642673, "res": {"Yes": 0.9981293961642673, "No": 0.0018705260079421545}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8373166454983408, "res": {"Yes": 0.8373166454983408, "No": 0.1626832532979152}, "ground_truth": 1}, {"key": "21820893", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999462853826817, "res": {"Yes": 0.9999462853826817, "No": 5.367324025100189e-05}, "ground_truth": 0}, {"key": "21820893", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9958366190016907, "res": {"Yes": 0.9958366190016907, "No": 0.004163392634247119}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.001726518026712353, "res": {"No": 0.9982732395692464, "Yes": 0.001726518026712353}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 8.733452298330147e-08}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9422791007427962, "res": {"Yes": 0.9422791007427962, "No": 0.057720216166218447}, "ground_truth": 1}, {"key": "40519933", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9722629815164352, "res": {"Yes": 0.9722629815164352, "No": 0.02773671200888418}, "ground_truth": 0}, {"key": "40519933", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9961621740507391, "res": {"Yes": 0.9961621740507391, "No": 0.003837614228989169}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 4.915893192538116e-05, "res": {"No": 0.999950814892627, "Yes": 4.915893192538116e-05}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9925031337450829, "res": {"Yes": 0.9925031337450829, "No": 0.007496830108368716}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999947998470209, "res": {"Yes": 0.9999947998470209, "No": 5.111615801062983e-06}, "ground_truth": 1}, {"key": "30446033", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 2.2714417089130946e-08}, "ground_truth": 0}, {"key": "30446033", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999186320055549, "res": {"Yes": 0.9999186320055549, "No": 8.12390106045446e-05}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9227341445894365, "res": {"Yes": 0.9227341445894365, "No": 0.07726569595189674}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.14667830376987323, "res": {"No": 0.8533216514306934, "Yes": 0.14667830376987323}, "ground_truth": 1}, {"key": "40216291", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6807980949356652, "res": {"Yes": 0.6807980949356652, "No": 0.31920172796402657}, "ground_truth": 0}, {"key": "40216291", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.02002807980201416, "res": {"No": 0.9799718580552427, "Yes": 0.02002807980201416}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9289167320443014, "res": {"Yes": 0.9289167320443014, "No": 0.07108323959427221}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996321967562031, "res": {"Yes": 0.9996321967562031, "No": 0.000367728229286459}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999946806438478, "res": {"Yes": 0.9999946806438478, "No": 5.216723683299374e-06}, "ground_truth": 1}, {"key": "33479118", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997178470126431, "res": {"Yes": 0.9997178470126431, "No": 0.0002820593635887905}, "ground_truth": 0}, {"key": "33479118", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999948788531352, "res": {"Yes": 0.999948788531352, "No": 5.115982509723478e-05}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.18826270961989977, "res": {"No": 0.8117370510666168, "Yes": 0.18826270961989977}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.48970175326325044, "res": {"No": 0.5102982093156433, "Yes": 0.48970175326325044}, "ground_truth": 1}, {"key": "22297373", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9927356935538236, "res": {"Yes": 0.9927356935538236, "No": 0.007264276310985446}, "ground_truth": 0}, {"key": "22297373", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9551335340937609, "res": {"Yes": 0.9551335340937609, "No": 0.04486636832404951}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.5153207122030398, "res": {"Yes": 0.5153207122030398, "No": 0.48467922432786803}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9050101770376227, "res": {"Yes": 0.9050101770376227, "No": 0.09498974885437558}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996835339659427, "res": {"Yes": 0.9996835339659427, "No": 0.00031642098499907003}, "ground_truth": 1}, {"key": "36463668", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997523995780452, "res": {"Yes": 0.9997523995780452, "No": 0.00024748588695138883}, "ground_truth": 0}, {"key": "36463668", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9795133395071245, "res": {"Yes": 0.9795133395071245, "No": 0.020486638209639245}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.1391069523990753, "res": {"No": 0.8608930227077369, "Yes": 0.1391069523990753}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999958726752174, "res": {"Yes": 0.9999958726752174, "No": 4.02985565606797e-06}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999378224131062, "res": {"Yes": 0.9999378224131062, "No": 6.214833688872199e-05}, "ground_truth": 1}, {"key": "35264615", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999973031140366, "res": {"Yes": 0.9999973031140366, "No": 2.5848476187515172e-06}, "ground_truth": 0}, {"key": "35264615", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999797803764193, "res": {"Yes": 0.9999797803764193, "No": 2.014607656388599e-05}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.758811795688029e-05, "res": {"No": 0.9999820452021894, "Yes": 1.758811795688029e-05}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.4068093625315235, "res": {"No": 0.5931902886352252, "Yes": 0.4068093625315235}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9818735379619679, "res": {"Yes": 0.9818735379619679, "No": 0.018126070824756254}, "ground_truth": 1}, {"key": "39898482", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9843161233075763, "res": {"Yes": 0.9843161233075763, "No": 0.015683595272576484}, "ground_truth": 0}, {"key": "39898482", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998328270349577, "res": {"Yes": 0.9998328270349577, "No": 0.00016705741537401}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9995263059284794, "res": {"Yes": 0.9995263059284794, "No": 0.00047359406791037625}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9647179549759772, "res": {"Yes": 0.9647179549759772, "No": 0.03528195978235065}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 8.263247342057965e-07}, "ground_truth": 1}, {"key": "37228721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 2.128480953582273e-06}, "ground_truth": 0}, {"key": "37228721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9927613064651225, "res": {"Yes": 0.9927613064651225, "No": 0.007238709748494379}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 2.409007051937659e-07, "res": {"No": 0.9999994487765019, "Yes": 2.409007051937659e-07}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999500997050611, "res": {"Yes": 0.9999500997050611, "No": 4.9850850525843485e-05}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 5.135584435167939e-07}, "ground_truth": 1}, {"key": "24535799", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998810866107576, "res": {"Yes": 0.9998810866107576, "No": 0.00011884053565704228}, "ground_truth": 0}, {"key": "24535799", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 5.952520503858974e-08}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 8.970267210408655e-05, "res": {"No": 0.9999101692710216, "Yes": 8.970267210408655e-05}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.4726854309665554e-06}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 1.2508167575186531e-08}, "ground_truth": 1}, {"key": "35177759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999971839107652, "res": {"Yes": 0.9999971839107652, "No": 2.7489294857038155e-06}, "ground_truth": 0}, {"key": "35177759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9991322665985597, "res": {"Yes": 0.9991322665985597, "No": 0.0008676492628689601}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0005302062903880915, "res": {"No": 0.9994695073210252, "Yes": 0.0005302062903880915}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999526028632798, "res": {"Yes": 0.9999526028632798, "No": 4.7295992084472936e-05}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9945454401290562, "res": {"Yes": 0.9945454401290562, "No": 0.00545452139764436}, "ground_truth": 1}, {"key": "34364829", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7825603460411359, "res": {"Yes": 0.7825603460411359, "No": 0.21743935389524366}, "ground_truth": 0}, {"key": "34364829", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9466081043600487, "res": {"Yes": 0.9466081043600487, "No": 0.053391752100084275}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9997521612171065, "res": {"Yes": 0.9997521612171065, "No": 0.00024778156158303683}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999967070975216, "res": {"Yes": 0.9999967070975216, "No": 3.1681808473120136e-06}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999968263007362, "res": {"Yes": 0.9999968263007362, "No": 3.0753495142322533e-06}, "ground_truth": 1}, {"key": "38090732", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.442521404787603e-06}, "ground_truth": 0}, {"key": "38090732", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999970244320709, "res": {"Yes": 0.999970244320709, "No": 2.965671448439412e-05}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0002608447904851693, "res": {"No": 0.999738936662965, "Yes": 0.0002608447904851693}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999700059218314, "res": {"Yes": 0.9999700059218314, "No": 2.997094936380826e-05}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999740587314805, "res": {"Yes": 0.9999740587314805, "No": 2.5832039381128413e-05}, "ground_truth": 1}, {"key": "30651479", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999858596579756, "res": {"Yes": 0.9999858596579756, "No": 1.4045591270541697e-05}, "ground_truth": 0}, {"key": "30651479", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998976540877003, "res": {"Yes": 0.9998976540877003, "No": 0.00010222462092112238}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0039542315302185695, "res": {"No": 0.9960457948395113, "Yes": 0.0039542315302185695}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.0013934667111350245, "res": {"No": 0.9986064490950908, "Yes": 0.0013934667111350245}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7109459085938805, "res": {"Yes": 0.7109459085938805, "No": 0.28905413213041337}, "ground_truth": 1}, {"key": "39380921", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9650506953322091, "res": {"Yes": 0.9650506953322091, "No": 0.034949266417764864}, "ground_truth": 0}, {"key": "39380921", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9974997674011004, "res": {"Yes": 0.9974997674011004, "No": 0.0025002788833239794}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.3168660974068124, "res": {"No": 0.6831337440910299, "Yes": 0.3168660974068124}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9992527153963205, "res": {"Yes": 0.9992527153963205, "No": 0.0007472092437054692}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 2.89755635031837e-08}, "ground_truth": 1}, {"key": "39037490", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 6.035107402282947e-07}, "ground_truth": 0}, {"key": "39037490", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995358340883432, "res": {"Yes": 0.9995358340883432, "No": 0.00046408956330527866}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.10047588806696914, "res": {"No": 0.899524075971801, "Yes": 0.10047588806696914}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9920934782797385, "res": {"Yes": 0.9920934782797385, "No": 0.007906453138320514}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9975193356457229, "res": {"Yes": 0.9975193356457229, "No": 0.0024806615508571163}, "ground_truth": 1}, {"key": "35917499", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998448646647308, "res": {"Yes": 0.9998448646647308, "No": 0.0001550850316772788}, "ground_truth": 0}, {"key": "35917499", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9758065101693871, "res": {"Yes": 0.9758065101693871, "No": 0.024193371216864698}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.7805774286806619, "res": {"Yes": 0.7805774286806619, "No": 0.21942238677439163}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.3974254200943381e-06}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999971839107652, "res": {"Yes": 0.9999971839107652, "No": 2.7022197313217563e-06}, "ground_truth": 1}, {"key": "34908073", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 8.662207961229273e-07}, "ground_truth": 0}, {"key": "34908073", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.7068911090715172e-07}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.059619975599459446, "res": {"No": 0.9403797048035788, "Yes": 0.059619975599459446}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.3661268933735397e-07}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.616854590315955e-07}, "ground_truth": 1}, {"key": "36344759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999956342685299, "res": {"Yes": 0.9999956342685299, "No": 4.305217063936258e-06}, "ground_truth": 0}, {"key": "36344759", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.3852637544911333e-06}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.2513532647670297, "res": {"No": 0.7486466718077669, "Yes": 0.2513532647670297}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 2.7668997372623337e-05, "res": {"No": 0.9999722707254635, "Yes": 2.7668997372623337e-05}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 1.2394549715916606e-08}, "ground_truth": 1}, {"key": "39984637", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 3.175035279550488e-08}, "ground_truth": 0}, {"key": "39984637", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.996623394497695, "res": {"Yes": 0.996623394497695, "No": 0.00337659997609766}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9979943877335121, "res": {"Yes": 0.9979943877335121, "No": 0.002005608044718787}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994088959708619, "res": {"Yes": 0.9994088959708619, "No": 0.0005910550486334725}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998844239234294, "res": {"Yes": 0.9998844239234294, "No": 0.00011555430099477447}, "ground_truth": 1}, {"key": "17917326", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998758496172967, "res": {"Yes": 0.9998758496172967, "No": 0.00012411537269209114}, "ground_truth": 0}, {"key": "17917326", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9983868176796534, "res": {"Yes": 0.9983868176796534, "No": 0.0016130948146669804}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 7.262756681564243e-05, "res": {"No": 0.9999269756164101, "Yes": 7.262756681564243e-05}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 5.297826546893958e-07}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9287717357443079, "res": {"Yes": 0.9287717357443079, "No": 0.0712282050972662}, "ground_truth": 1}, {"key": "32193638", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.4028239178164795e-07}, "ground_truth": 0}, {"key": "32193638", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.0016315317198186071, "res": {"No": 0.9983684041021875, "Yes": 0.0016315317198186071}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999820452021894, "res": {"Yes": 0.9999820452021894, "No": 1.7935492268342405e-05}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999695291212467, "res": {"Yes": 0.9999695291212467, "No": 3.0342141595471925e-05}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9952690158279638, "res": {"Yes": 0.9952690158279638, "No": 0.004730925640302403}, "ground_truth": 1}, {"key": "34564692", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999996945503965, "res": {"Yes": 0.999996945503965, "No": 2.9426794915359877e-06}, "ground_truth": 0}, {"key": "34564692", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9327399700820579, "res": {"Yes": 0.9327399700820579, "No": 0.06725990399785363}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.12438030887403277, "res": {"No": 0.8756194589669714, "Yes": 0.12438030887403277}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999808531883025, "res": {"Yes": 0.9999808531883025, "No": 1.9125156409702844e-05}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999961110815618, "res": {"Yes": 0.9999961110815618, "No": 3.7896666419785593e-06}, "ground_truth": 1}, {"key": "39329284", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999983356420506, "res": {"Yes": 0.999983356420506, "No": 1.6599549525301868e-05}, "ground_truth": 0}, {"key": "39329284", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 1.2394955284834564e-05, "res": {"No": 0.9999874092852638, "Yes": 1.2394955284834564e-05}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.37874356969714035, "res": {"No": 0.6212563998841336, "Yes": 0.37874356969714035}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.5257625836610372, "res": {"Yes": 0.5257625836610372, "No": 0.4742373709698614}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9984899712424417, "res": {"Yes": 0.9984899712424417, "No": 0.0015099505153253656}, "ground_truth": 1}, {"key": "37438541", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999531988512079, "res": {"Yes": 0.9999531988512079, "No": 4.670113918051012e-05}, "ground_truth": 0}, {"key": "37438541", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9973984794350517, "res": {"Yes": 0.9973984794350517, "No": 0.0026015496298974323}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00015531829973692364, "res": {"No": 0.9998445071102727, "Yes": 0.00015531829973692364}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993001992748232, "res": {"Yes": 0.9993001992748232, "No": 0.0006997018095751725}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998852582493383, "res": {"Yes": 0.9998852582493383, "No": 0.00011464731133543679}, "ground_truth": 1}, {"key": "34652757", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999474773593622, "res": {"Yes": 0.9999474773593622, "No": 5.239795469171124e-05}, "ground_truth": 0}, {"key": "34652757", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999888397127765, "res": {"Yes": 0.9999888397127765, "No": 1.1065327356906161e-05}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999907469518097, "res": {"Yes": 0.9999907469518097, "No": 9.153612022640396e-06}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.4299416667515113e-07}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999868132749457, "res": {"Yes": 0.9999868132749457, "No": 1.3079669236294897e-05}, "ground_truth": 1}, {"key": "31361004", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.330068464282908e-07}, "ground_truth": 0}, {"key": "31361004", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998537999282723, "res": {"Yes": 0.9998537999282723, "No": 0.00014609828175833717}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.5559344429759073, "res": {"Yes": 0.5559344429759073, "No": 0.4440656087551033}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.014061088182058703, "res": {"No": 0.9859388702692182, "Yes": 0.014061088182058703}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9790461075328616, "res": {"Yes": 0.9790461075328616, "No": 0.020953910318148198}, "ground_truth": 1}, {"key": "26150727", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992348593694926, "res": {"Yes": 0.9992348593694926, "No": 0.000765107891072814}, "ground_truth": 0}, {"key": "26150727", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997519228962147, "res": {"Yes": 0.9997519228962147, "No": 0.0002479620122359374}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9266982952345096, "res": {"Yes": 0.9266982952345096, "No": 0.07330139785089117}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9948064583151762, "res": {"Yes": 0.9948064583151762, "No": 0.0051934503259494546}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.990063197532016, "res": {"Yes": 0.990063197532016, "No": 0.009936718933275981}, "ground_truth": 1}, {"key": "36997402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8941625652635787, "res": {"Yes": 0.8941625652635787, "No": 0.10583701103333386}, "ground_truth": 0}, {"key": "36997402", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.857592820773668, "res": {"Yes": 0.857592820773668, "No": 0.14240694644202923}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.707714329418784e-07}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 2.641483639471711e-08}, "ground_truth": 1}, {"key": "37430643", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999843100330889, "res": {"Yes": 0.9999843100330889, "No": 1.5646645640838877e-05}, "ground_truth": 0}, {"key": "37430643", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9973312372957991, "res": {"Yes": 0.9973312372957991, "No": 0.0026687894470514956}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.6988963157576994, "res": {"Yes": 0.6988963157576994, "No": 0.30110341554555065}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998681023692575, "res": {"Yes": 0.9998681023692575, "No": 0.00013182160852223316}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9896501719174535, "res": {"Yes": 0.9896501719174535, "No": 0.010349500720495257}, "ground_truth": 1}, {"key": "36964631", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999961110815618, "res": {"Yes": 0.9999961110815618, "No": 3.7681439450600182e-06}, "ground_truth": 0}, {"key": "36964631", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999925349918634, "res": {"Yes": 0.9999925349918634, "No": 7.354302807810537e-06}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8877706023944094, "res": {"Yes": 0.8877706023944094, "No": 0.1122293649992908}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.6230929025774766, "res": {"Yes": 0.6230929025774766, "No": 0.3769070589165419}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9983341813187226, "res": {"Yes": 0.9983341813187226, "No": 0.0016657749973009622}, "ground_truth": 1}, {"key": "35502013", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 2.1326248776968134e-06}, "ground_truth": 0}, {"key": "35502013", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.005119152402611368, "res": {"No": 0.9948807904441619, "Yes": 0.005119152402611368}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.6876387167335111, "res": {"Yes": 0.6876387167335111, "No": 0.3123608465553655}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999080237900709, "res": {"Yes": 0.9999080237900709, "No": 9.190161089270032e-05}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.863081557350681e-07}, "ground_truth": 1}, {"key": "33987664", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990791969995056, "res": {"Yes": 0.9990791969995056, "No": 0.0009207481609317872}, "ground_truth": 0}, {"key": "33987664", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9970753132536714, "res": {"Yes": 0.9970753132536714, "No": 0.002924633807946991}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.17512161562386244, "res": {"No": 0.8248781586821928, "Yes": 0.17512161562386244}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999012298380936, "res": {"Yes": 0.9999012298380936, "No": 9.864450786303324e-05}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.24073621223399255, "res": {"No": 0.7592636476841383, "Yes": 0.24073621223399255}, "ground_truth": 1}, {"key": "35203721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5427960435568476, "res": {"Yes": 0.5427960435568476, "No": 0.4572039077332091}, "ground_truth": 0}, {"key": "35203721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9238953549246708, "res": {"Yes": 0.9238953549246708, "No": 0.0761045748216175}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9189303485293009, "res": {"Yes": 0.9189303485293009, "No": 0.08106961897047843}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999846676395419, "res": {"Yes": 0.9999846676395419, "No": 1.526764003184864e-05}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.895000689532206e-07}, "ground_truth": 1}, {"key": "39028348", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.111520225634009e-07}, "ground_truth": 0}, {"key": "39028348", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998764455634782, "res": {"Yes": 0.9998764455634782, "No": 0.00012344251201837215}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.25186896672933456, "res": {"No": 0.7481307625821122, "Yes": 0.25186896672933456}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.45508395980966526, "res": {"No": 0.5449156483321802, "Yes": 0.45508395980966526}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9894799711786098, "res": {"Yes": 0.9894799711786098, "No": 0.01051993763418033}, "ground_truth": 1}, {"key": "37459383", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9892569749459891, "res": {"Yes": 0.9892569749459891, "No": 0.010742902231600416}, "ground_truth": 0}, {"key": "37459383", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9185610586987052, "res": {"Yes": 0.9185610586987052, "No": 0.08143865838314385}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.7993584983916431, "res": {"Yes": 0.7993584983916431, "No": 0.20064148906282586}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996575634447856, "res": {"Yes": 0.9996575634447856, "No": 0.00034240312054396556}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999418750973176, "res": {"Yes": 0.9999418750973176, "No": 5.807373858449999e-05}, "ground_truth": 1}, {"key": "34020070", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986431885021702, "res": {"Yes": 0.9986431885021702, "No": 0.0013567379860601075}, "ground_truth": 0}, {"key": "34020070", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9979411954514522, "res": {"Yes": 0.9979411954514522, "No": 0.0020588397150173208}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.26492550651621805, "res": {"No": 0.735074444400228, "Yes": 0.26492550651621805}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999996945503965, "res": {"Yes": 0.999996945503965, "No": 2.9362655650240736e-06}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999950814892627, "res": {"Yes": 0.999950814892627, "No": 4.910081129404509e-05}, "ground_truth": 1}, {"key": "35176615", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999906277489198, "res": {"Yes": 0.9999906277489198, "No": 9.238675747054018e-06}, "ground_truth": 0}, {"key": "35176615", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.6972410002859543, "res": {"Yes": 0.6972410002859543, "No": 0.30275893021189476}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9665517133220018, "res": {"Yes": 0.9665517133220018, "No": 0.033448257046455196}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.993335232738274, "res": {"Yes": 0.993335232738274, "No": 0.006664758900328387}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999890781166442, "res": {"Yes": 0.9999890781166442, "No": 1.0886228586108269e-05}, "ground_truth": 1}, {"key": "33296389", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 4.526683947231001e-07}, "ground_truth": 0}, {"key": "33296389", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997970762218157, "res": {"Yes": 0.9997970762218157, "No": 0.00020287673096316047}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.6472128057562887e-07}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999764427474764, "res": {"Yes": 0.9999764427474764, "No": 2.3481469025295627e-05}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999988527586581, "res": {"Yes": 0.9999988527586581, "No": 1.1222477098092205e-06}, "ground_truth": 1}, {"key": "35399504", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999953958625991, "res": {"Yes": 0.9999953958625991, "No": 4.564333759104806e-06}, "ground_truth": 0}, {"key": "35399504", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999828796125555, "res": {"Yes": 0.9999828796125555, "No": 1.708496023294936e-05}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.3188760849804624, "res": {"No": 0.6811238939076216, "Yes": 0.3188760849804624}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991120417684421, "res": {"Yes": 0.9991120417684421, "No": 0.0008879359020087139}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.5775872942060414e-07}, "ground_truth": 1}, {"key": "34807886", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.3134239370567565e-07}, "ground_truth": 0}, {"key": "34807886", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994586692723768, "res": {"Yes": 0.9994586692723768, "No": 0.0005412230889870314}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.002593682495902718, "res": {"No": 0.9974063082459214, "Yes": 0.002593682495902718}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999707211216348, "res": {"Yes": 0.9999707211216348, "No": 2.92270180736383e-05}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999267474727732, "res": {"Yes": 0.999267474727732, "No": 0.0007325272620133135}, "ground_truth": 1}, {"key": "37629813", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9830308262181107, "res": {"Yes": 0.9830308262181107, "No": 0.016969171879726366}, "ground_truth": 0}, {"key": "37629813", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999620195462757, "res": {"Yes": 0.9999620195462757, "No": 3.786770196856263e-05}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9957068344964055, "res": {"Yes": 0.9957068344964055, "No": 0.004293190998701298}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6092517281259544, "res": {"Yes": 0.6092517281259544, "No": 0.39074822978168516}, "ground_truth": 1}, {"key": "28084389", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9593207087844161, "res": {"Yes": 0.9593207087844161, "No": 0.04067925588018215}, "ground_truth": 0}, {"key": "28084389", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999037328639782, "res": {"Yes": 0.9999037328639782, "No": 9.616289322650091e-05}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9572132773634324, "res": {"Yes": 0.9572132773634324, "No": 0.04278667314493606}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.7945805608268467, "res": {"Yes": 0.7945805608268467, "No": 0.20541946904020703}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999638739590262, "res": {"Yes": 0.999638739590262, "No": 0.0003611341723945951}, "ground_truth": 1}, {"key": "35391734", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.996983594221119, "res": {"Yes": 0.996983594221119, "No": 0.0030164223565410228}, "ground_truth": 0}, {"key": "35391734", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.04281152230037578, "res": {"No": 0.9571883767411189, "Yes": 0.04281152230037578}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00019366145512427385, "res": {"No": 0.9998062530813588, "Yes": 0.00019366145512427385}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.3563574068239329, "res": {"No": 0.6436425522894444, "Yes": 0.3563574068239329}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9763184949588055, "res": {"Yes": 0.9763184949588055, "No": 0.023681446157279958}, "ground_truth": 1}, {"key": "40214591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9700916533099612, "res": {"Yes": 0.9700916533099612, "No": 0.02990826545993443}, "ground_truth": 0}, {"key": "40214591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996020607688274, "res": {"Yes": 0.9996020607688274, "No": 0.00039784721829851425}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 7.701102226933897e-05, "res": {"No": 0.9999228038037797, "Yes": 7.701102226933897e-05}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999868132749457, "res": {"Yes": 0.9999868132749457, "No": 1.305663662271903e-05}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999982567412194, "res": {"Yes": 0.9999982567412194, "No": 1.6284238078991994e-06}, "ground_truth": 1}, {"key": "26283171", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999847868417213, "res": {"Yes": 0.9999847868417213, "No": 1.5106582227775077e-05}, "ground_truth": 0}, {"key": "26283171", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997918323398948, "res": {"Yes": 0.9997918323398948, "No": 0.0002081286832684951}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9996931864469076, "res": {"Yes": 0.9996931864469076, "No": 0.00030678204918812565}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9960299465821393, "res": {"Yes": 0.9960299465821393, "No": 0.003970099982862653}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991438157350913, "res": {"Yes": 0.9991438157350913, "No": 0.0008561323322679055}, "ground_truth": 1}, {"key": "37084030", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998030352201097, "res": {"Yes": 0.9998030352201097, "No": 0.00019686644564902565}, "ground_truth": 0}, {"key": "37084030", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9828672723432291, "res": {"Yes": 0.9828672723432291, "No": 0.017132783279736778}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998849006744357, "res": {"Yes": 0.9998849006744357, "No": 0.00011508092286254944}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999611851533157, "res": {"Yes": 0.9999611851533157, "No": 3.879438648591552e-05}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998967005557551, "res": {"Yes": 0.9998967005557551, "No": 0.0001032134896289762}, "ground_truth": 1}, {"key": "39027295", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999895549275502, "res": {"Yes": 0.9999895549275502, "No": 1.036072337219027e-05}, "ground_truth": 0}, {"key": "39027295", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999759659438225, "res": {"Yes": 0.9999759659438225, "No": 2.4014397779733422e-05}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.2675434489110561, "res": {"No": 0.7324565186921745, "Yes": 0.2675434489110561}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999831180165023, "res": {"Yes": 0.9999831180165023, "No": 1.6765187400989942e-05}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999978707566687, "res": {"Yes": 0.999978707566687, "No": 2.1174583225600482e-05}, "ground_truth": 1}, {"key": "14018647", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999908661547138, "res": {"Yes": 0.9999908661547138, "No": 9.00176399850161e-06}, "ground_truth": 0}, {"key": "14018647", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999938462231346, "res": {"Yes": 0.9999938462231346, "No": 6.125874721846914e-06}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.34892056155827317, "res": {"No": 0.6510791512909745, "Yes": 0.34892056155827317}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.014490166964153858, "res": {"No": 0.9855093823883784, "Yes": 0.014490166964153858}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7978619511849493, "res": {"Yes": 0.7978619511849493, "No": 0.2021378274787971}, "ground_truth": 1}, {"key": "37424289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9596548791899281, "res": {"Yes": 0.9596548791899281, "No": 0.04034472193037514}, "ground_truth": 0}, {"key": "37424289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.4321521904803367, "res": {"No": 0.5678475182990419, "Yes": 0.4321521904803367}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.15321825052770413, "res": {"No": 0.8467816498069319, "Yes": 0.15321825052770413}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999975415208221, "res": {"Yes": 0.9999975415208221, "No": 2.361390305229391e-06}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999967070975216, "res": {"Yes": 0.9999967070975216, "No": 3.258668114176966e-06}, "ground_truth": 1}, {"key": "37498031", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999204199166628, "res": {"Yes": 0.9999204199166628, "No": 7.951212756109022e-05}, "ground_truth": 0}, {"key": "37498031", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998417658603422, "res": {"Yes": 0.9998417658603422, "No": 0.0001581421888817295}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.861806940793134, "res": {"Yes": 0.861806940793134, "No": 0.13819308570200275}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999547484278832, "res": {"Yes": 0.9999547484278832, "No": 4.516798583771767e-05}, "ground_truth": 1}, {"key": "30104095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991234605853084, "res": {"Yes": 0.9991234605853084, "No": 0.0008764336984407846}, "ground_truth": 0}, {"key": "30104095", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.04409078391007469, "res": {"No": 0.9559091871153307, "Yes": 0.04409078391007469}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9658201366982551, "res": {"Yes": 0.9658201366982551, "No": 0.034179794964867546}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9865024815630754, "res": {"Yes": 0.9865024815630754, "No": 0.01349741221081555}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.994438156939613, "res": {"Yes": 0.994438156939613, "No": 0.005561819366806775}, "ground_truth": 1}, {"key": "37911407", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991448876471261, "res": {"Yes": 0.9991448876471261, "No": 0.0008551115753980488}, "ground_truth": 0}, {"key": "37911407", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999707211216348, "res": {"Yes": 0.9999707211216348, "No": 2.9250877053526308e-05}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9955677465558022, "res": {"Yes": 0.9955677465558022, "No": 0.004432131320054135}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999933694113825, "res": {"Yes": 0.9999933694113825, "No": 6.590904272310504e-06}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999043288267786, "res": {"Yes": 0.9999043288267786, "No": 9.555562684508539e-05}, "ground_truth": 1}, {"key": "39177472", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998037502994923, "res": {"Yes": 0.9998037502994923, "No": 0.00019620549580240743}, "ground_truth": 0}, {"key": "39177472", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999117187730169, "res": {"Yes": 0.9999117187730169, "No": 8.823966319024172e-05}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.6882628806913516, "res": {"Yes": 0.6882628806913516, "No": 0.3117369050360885}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999398487531588, "res": {"Yes": 0.9999398487531588, "No": 6.0045496985612656e-05}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999132682854126, "res": {"Yes": 0.9999132682854126, "No": 8.67076016844442e-05}, "ground_truth": 1}, {"key": "32325454", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992141486430438, "res": {"Yes": 0.9992141486430438, "No": 0.0007858630636404261}, "ground_truth": 0}, {"key": "32325454", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999502733378049, "res": {"Yes": 0.999502733378049, "No": 0.0004972108879677552}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9335000896163401, "res": {"Yes": 0.9335000896163401, "No": 0.06649975603324937}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999843100330889, "res": {"Yes": 0.9999843100330889, "No": 1.5562887258011796e-05}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.2074321090115226e-07}, "ground_truth": 1}, {"key": "38395319", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.8332477003295357e-07}, "ground_truth": 0}, {"key": "38395319", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 5.662926136957314e-08}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9946134869683929, "res": {"Yes": 0.9946134869683929, "No": 0.005386531541443487}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998225772812724, "res": {"Yes": 0.9998225772812724, "No": 0.00017734953476627275}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9789044370845271, "res": {"Yes": 0.9789044370845271, "No": 0.02109555129139962}, "ground_truth": 1}, {"key": "38235895", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999135066767632, "res": {"Yes": 0.9999135066767632, "No": 8.639065912309526e-05}, "ground_truth": 0}, {"key": "38235895", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.924462575291774, "res": {"Yes": 0.924462575291774, "No": 0.07553735325302284}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00016176773274829794, "res": {"No": 0.9998380711318946, "Yes": 0.00016176773274829794}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9919932809064413, "res": {"Yes": 0.9919932809064413, "No": 0.00800665906833087}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999553444170902, "res": {"Yes": 0.9999553444170902, "No": 4.45575475895922e-05}, "ground_truth": 1}, {"key": "26543267", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999953958625991, "res": {"Yes": 0.9999953958625991, "No": 4.583979732126425e-06}, "ground_truth": 0}, {"key": "26543267", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996425527394996, "res": {"Yes": 0.9996425527394996, "No": 0.0003573219363690056}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.004548885595882151, "res": {"No": 0.9954510167096795, "Yes": 0.004548885595882151}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9976486465725638, "res": {"Yes": 0.9976486465725638, "No": 0.0023513148421359987}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998447454732317, "res": {"Yes": 0.9998447454732317, "No": 0.0001552187726086447}, "ground_truth": 1}, {"key": "39054728", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999955150656573, "res": {"Yes": 0.9999955150656573, "No": 4.350068351494012e-06}, "ground_truth": 0}, {"key": "39054728", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.2324142358666156, "res": {"No": 0.7675857188186316, "Yes": 0.2324142358666156}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.99998752848777, "res": {"Yes": 0.99998752848777, "No": 1.2388177098296772e-05}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994890391849617, "res": {"Yes": 0.9994890391849617, "No": 0.0005109422437898696}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999955150656573, "res": {"Yes": 0.9999955150656573, "No": 4.44207477055892e-06}, "ground_truth": 1}, {"key": "39158443", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999709595226828, "res": {"Yes": 0.9999709595226828, "No": 2.8962345578321542e-05}, "ground_truth": 0}, {"key": "39158443", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999602315637852, "res": {"Yes": 0.9999602315637852, "No": 3.9735522382477415e-05}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999480733442354, "res": {"Yes": 0.9999480733442354, "No": 5.184925457287947e-05}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.99999861435166, "res": {"Yes": 0.99999861435166, "No": 1.3160206943431808e-06}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999946523779904, "res": {"Yes": 0.999946523779904, "No": 5.34382914829575e-05}, "ground_truth": 1}, {"key": "36254201", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988709014120329, "res": {"Yes": 0.9988709014120329, "No": 0.0011291117695488532}, "ground_truth": 0}, {"key": "36254201", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9953605423871676, "res": {"Yes": 0.9953605423871676, "No": 0.004639459066665617}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 8.775586905722448e-07}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994291378038616, "res": {"Yes": 0.9994291378038616, "No": 0.000570835489087206}, "ground_truth": 1}, {"key": "23434347", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 5.203490502905906e-07}, "ground_truth": 0}, {"key": "23434347", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999889589149532, "res": {"Yes": 0.9999889589149532, "No": 1.1025806360847693e-05}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0032748687075376515, "res": {"No": 0.9967248726685315, "Yes": 0.0032748687075376515}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999905085465441, "res": {"Yes": 0.9999905085465441, "No": 9.360320749059472e-06}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.011294673907464534, "res": {"No": 0.9887052402020432, "Yes": 0.011294673907464534}, "ground_truth": 1}, {"key": "34397620", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999375840279578, "res": {"Yes": 0.9999375840279578, "No": 6.225442131506601e-05}, "ground_truth": 0}, {"key": "34397620", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.03411121715354993, "res": {"No": 0.9658883095868589, "Yes": 0.03411121715354993}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0016751837805374919, "res": {"No": 0.9983246719314353, "Yes": 0.0016751837805374919}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9779798934531652, "res": {"Yes": 0.9779798934531652, "No": 0.022020102342318854}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 3.9963192258817885e-08}, "ground_truth": 1}, {"key": "34340916", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 7.079679589479481e-07}, "ground_truth": 0}, {"key": "34340916", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999763235462916, "res": {"Yes": 0.9999763235462916, "No": 2.35460612975763e-05}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8407334107888148, "res": {"Yes": 0.8407334107888148, "No": 0.1592664170575387}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9770139682096003, "res": {"Yes": 0.9770139682096003, "No": 0.022986021699611857}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9966645997471062, "res": {"Yes": 0.9966645997471062, "No": 0.0033353365171914662}, "ground_truth": 1}, {"key": "30375089", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9991664196812675, "res": {"Yes": 0.9991664196812675, "No": 0.0008335288027347976}, "ground_truth": 0}, {"key": "30375089", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9978169139062325, "res": {"Yes": 0.9978169139062325, "No": 0.002183082303738957}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9233394961134831, "res": {"Yes": 0.9233394961134831, "No": 0.0766602851013491}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.984335870855729, "res": {"Yes": 0.984335870855729, "No": 0.015664003026190833}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999537948404913, "res": {"Yes": 0.9999537948404913, "No": 4.612488263986453e-05}, "ground_truth": 1}, {"key": "35807797", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997142718880543, "res": {"Yes": 0.9997142718880543, "No": 0.0002855224208722052}, "ground_truth": 0}, {"key": "35807797", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.26239777535919245, "res": {"No": 0.7376018784776338, "Yes": 0.26239777535919245}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.20742347552141577, "res": {"No": 0.7925764983522054, "Yes": 0.20742347552141577}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999981375378344, "res": {"Yes": 0.9999981375378344, "No": 1.7801552114819278e-06}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7568605170892925, "res": {"Yes": 0.7568605170892925, "No": 0.2431394334490806}, "ground_truth": 1}, {"key": "34188172", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999808531883025, "res": {"Yes": 0.9999808531883025, "No": 1.9049951544320914e-05}, "ground_truth": 0}, {"key": "34188172", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999256644730222, "res": {"Yes": 0.9999256644730222, "No": 7.426127054120013e-05}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9969469814684992, "res": {"Yes": 0.9969469814684992, "No": 0.0030530313399062025}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9272953089643302, "res": {"Yes": 0.9272953089643302, "No": 0.07270455802886168}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.29869747711878825, "res": {"No": 0.7013024990444142, "Yes": 0.29869747711878825}, "ground_truth": 1}, {"key": "37075567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999860980626328, "res": {"Yes": 0.9999860980626328, "No": 1.387042059522954e-05}, "ground_truth": 0}, {"key": "37075567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.0019641533335991563, "res": {"No": 0.998035707951723, "Yes": 0.0019641533335991563}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.6866893310691061, "res": {"Yes": 0.6866893310691061, "No": 0.3133105524425239}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.1811464890337026e-07}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 4.25678739841074e-08}, "ground_truth": 1}, {"key": "35559735", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 5.615837572066194e-08}, "ground_truth": 0}, {"key": "35559735", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999996945503965, "res": {"Yes": 0.999996945503965, "No": 3.0396839857665806e-06}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.23093936317422722, "res": {"No": 0.7690604299916706, "Yes": 0.23093936317422722}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998905026252752, "res": {"Yes": 0.9998905026252752, "No": 0.00010945949344749311}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999939654258081, "res": {"Yes": 0.9999939654258081, "No": 5.985545970342752e-06}, "ground_truth": 1}, {"key": "33005019", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998622621767251, "res": {"Yes": 0.9998622621767251, "No": 0.00013762685284703403}, "ground_truth": 0}, {"key": "33005019", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8673071216825539, "res": {"Yes": 0.8673071216825539, "No": 0.13269266688797987}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.010581144315879209, "res": {"No": 0.9894186921078972, "Yes": 0.010581144315879209}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.99895416167051, "res": {"Yes": 0.99895416167051, "No": 0.001045779958700707}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992248575782243, "res": {"Yes": 0.9992248575782243, "No": 0.0007750763634353981}, "ground_truth": 1}, {"key": "30808252", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9634304716543366, "res": {"Yes": 0.9634304716543366, "No": 0.036569489735798294}, "ground_truth": 0}, {"key": "30808252", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.7053855967115523, "res": {"Yes": 0.7053855967115523, "No": 0.29461433999032904}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.31411381204630257, "res": {"No": 0.6858861480305536, "Yes": 0.31411381204630257}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999925349918634, "res": {"Yes": 0.9999925349918634, "No": 7.340654869791595e-06}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9893793704222029, "res": {"Yes": 0.9893793704222029, "No": 0.010620597531657174}, "ground_truth": 1}, {"key": "15159017", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9923240808946742, "res": {"Yes": 0.9923240808946742, "No": 0.007675920944029491}, "ground_truth": 0}, {"key": "15159017", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985663927979926, "res": {"Yes": 0.9985663927979926, "No": 0.0014335626060977351}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.01987695417509376, "res": {"No": 0.9801228911957525, "Yes": 0.01987695417509376}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990730077230515, "res": {"Yes": 0.9990730077230515, "No": 0.0009269592058509671}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993467507602515, "res": {"Yes": 0.9993467507602515, "No": 0.0006532127354783047}, "ground_truth": 1}, {"key": "24493400", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998865693437434, "res": {"Yes": 0.9998865693437434, "No": 0.0001133415195848189}, "ground_truth": 0}, {"key": "24493400", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.014901710111987283, "res": {"No": 0.9850982042830447, "Yes": 0.014901710111987283}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 7.317114512402503e-06, "res": {"No": 0.9999925349918634, "Yes": 7.317114512402503e-06}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994984442211723, "res": {"Yes": 0.9994984442211723, "No": 0.0005014411025657884}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.99999861435166, "res": {"Yes": 0.99999861435166, "No": 1.3551844329729002e-06}, "ground_truth": 1}, {"key": "37791071", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 4.510827649404686e-07}, "ground_truth": 0}, {"key": "37791071", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999829988145218, "res": {"Yes": 0.9999829988145218, "No": 1.695925254857587e-05}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9984873564003288, "res": {"Yes": 0.9984873564003288, "No": 0.0015125807213436089}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994988016418799, "res": {"Yes": 0.9994988016418799, "No": 0.0005011545607330194}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999462853826817, "res": {"Yes": 0.9999462853826817, "No": 5.364276250703804e-05}, "ground_truth": 1}, {"key": "33528627", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999464045822857, "res": {"Yes": 0.9999464045822857, "No": 5.348357288981227e-05}, "ground_truth": 0}, {"key": "33528627", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999697353626656, "res": {"Yes": 0.999697353626656, "No": 0.0003026099123125376}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9942045602284583, "res": {"Yes": 0.9942045602284583, "No": 0.005795401040569779}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999328161869334, "res": {"Yes": 0.9999328161869334, "No": 6.71063421882114e-05}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999864556687252, "res": {"Yes": 0.9999864556687252, "No": 1.3482567543921728e-05}, "ground_truth": 1}, {"key": "39925662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999690523188893, "res": {"Yes": 0.9999690523188893, "No": 3.0916145575119396e-05}, "ground_truth": 0}, {"key": "39925662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9926862426496689, "res": {"Yes": 0.9926862426496689, "No": 0.00731377004600567}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 8.75914646737687e-05, "res": {"No": 0.9999123147445768, "Yes": 8.75914646737687e-05}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9841867808559415, "res": {"Yes": 0.9841867808559415, "No": 0.015813208613444915}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9583947974556413, "res": {"Yes": 0.9583947974556413, "No": 0.041605167528267775}, "ground_truth": 1}, {"key": "29213416", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999272140090287, "res": {"Yes": 0.9999272140090287, "No": 7.271542664448711e-05}, "ground_truth": 0}, {"key": "29213416", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.2112146424016386, "res": {"No": 0.7887853802746833, "Yes": 0.2112146424016386}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.5071396852622564, "res": {"Yes": 0.5071396852622564, "No": 0.4928603553164059}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999779923581718, "res": {"Yes": 0.9999779923581718, "No": 2.1887934697777652e-05}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 4.376081332385699e-07}, "ground_truth": 1}, {"key": "34492745", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.89723626123456e-07}, "ground_truth": 0}, {"key": "34492745", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9989946090444958, "res": {"Yes": 0.9989946090444958, "No": 0.0010053159588146994}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999988527586581, "res": {"Yes": 0.9999988527586581, "No": 1.0738427369714752e-06}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999936078174301, "res": {"Yes": 0.9999936078174301, "No": 6.374053171933014e-06}, "ground_truth": 1}, {"key": "34191937", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999806147848957, "res": {"Yes": 0.9999806147848957, "No": 1.9351705554913578e-05}, "ground_truth": 0}, {"key": "34191937", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 7.547992629019415e-07}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.8388746900388768, "res": {"Yes": 0.8388746900388768, "No": 0.16112522843074578}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9835619330954462, "res": {"Yes": 0.9835619330954462, "No": 0.01643789892725405}, "ground_truth": 1}, {"key": "34933372", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997155827542556, "res": {"Yes": 0.9997155827542556, "No": 0.0002843696732110602}, "ground_truth": 0}, {"key": "34933372", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.996669805140571, "res": {"Yes": 0.996669805140571, "No": 0.003330217705832162}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00020729285625881535, "res": {"No": 0.9997926665865435, "Yes": 0.00020729285625881535}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.0012266419072256857, "res": {"No": 0.9987731449028249, "Yes": 0.0012266419072256857}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4391299043493444, "res": {"No": 0.5608699267324491, "Yes": 0.4391299043493444}, "ground_truth": 1}, {"key": "38714379", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 2.041758917775179e-07, "res": {"No": 0.9999995679800934, "Yes": 2.041758917775179e-07}, "ground_truth": 0}, {"key": "38714379", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.00011510163929308755, "res": {"No": 0.9998847814881626, "Yes": 0.00011510163929308755}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9824383846791584, "res": {"Yes": 0.9824383846791584, "No": 0.01756160489534712}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.945093050687412, "res": {"Yes": 0.945093050687412, "No": 0.05490682067627834}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9786330871497309, "res": {"Yes": 0.9786330871497309, "No": 0.02136689109740674}, "ground_truth": 1}, {"key": "39220660", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9112601929890165, "res": {"Yes": 0.9112601929890165, "No": 0.08873974558556881}, "ground_truth": 0}, {"key": "39220660", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.17583860881689234, "res": {"No": 0.824161329507025, "Yes": 0.17583860881689234}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.07999817956537315, "res": {"No": 0.9200015630252547, "Yes": 0.07999817956537315}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999561788061766, "res": {"Yes": 0.9999561788061766, "No": 4.379571834677544e-05}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9937228461657512, "res": {"Yes": 0.9937228461657512, "No": 0.006277157678003}, "ground_truth": 1}, {"key": "41028780", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996835339659427, "res": {"Yes": 0.9996835339659427, "No": 0.00031638934448262237}, "ground_truth": 0}, {"key": "41028780", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999570131939592, "res": {"Yes": 0.9999570131939592, "No": 4.2862081671552446e-05}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.4137314695003176, "res": {"No": 0.5862682673782883, "Yes": 0.4137314695003176}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999897933310884, "res": {"Yes": 0.9999897933310884, "No": 1.0114656979306674e-05}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 4.7893266955837975e-09}, "ground_truth": 1}, {"key": "39457108", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 4.433541693337422e-08}, "ground_truth": 0}, {"key": "39457108", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999142218341572, "res": {"Yes": 0.9999142218341572, "No": 8.573735040009634e-05}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 9.756664187776926e-06, "res": {"No": 0.9999896741293122, "Yes": 9.756664187776926e-06}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.998692641538644, "res": {"Yes": 0.998692641538644, "No": 0.0013073122068353814}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998041078293773, "res": {"Yes": 0.9998041078293773, "No": 0.00019577940837937902}, "ground_truth": 1}, {"key": "38288018", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9981619390069084, "res": {"Yes": 0.9981619390069084, "No": 0.0018380916358636398}, "ground_truth": 0}, {"key": "38288018", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.03544227366394258, "res": {"No": 0.9645576717219178, "Yes": 0.03544227366394258}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 4.500648353575238e-05, "res": {"No": 0.9999548676244963, "Yes": 4.500648353575238e-05}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999862172649827, "res": {"Yes": 0.9999862172649827, "No": 1.3674729369726875e-05}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9929666164343777, "res": {"Yes": 0.9929666164343777, "No": 0.007033342667756049}, "ground_truth": 1}, {"key": "40106293", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999871708812939, "res": {"Yes": 0.9999871708812939, "No": 1.271402300536884e-05}, "ground_truth": 0}, {"key": "40106293", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9628483588777245, "res": {"Yes": 0.9628483588777245, "No": 0.0371515420474557}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.07724747884867217, "res": {"No": 0.9227524287476612, "Yes": 0.07724747884867217}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9981436446629096, "res": {"Yes": 0.9981436446629096, "No": 0.001856342732052087}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999937270200753, "res": {"Yes": 0.9999937270200753, "No": 6.2153407964483e-06}, "ground_truth": 1}, {"key": "39948797", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.974044576460793, "res": {"Yes": 0.974044576460793, "No": 0.02595532728690342}, "ground_truth": 0}, {"key": "39948797", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9983063782985958, "res": {"Yes": 0.9983063782985958, "No": 0.0016935607735343132}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00010693172620585043, "res": {"No": 0.9998928864370674, "Yes": 0.00010693172620585043}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.23737834934919885, "res": {"No": 0.7626215678216289, "Yes": 0.23737834934919885}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999978707566687, "res": {"Yes": 0.999978707566687, "No": 2.1226354745135017e-05}, "ground_truth": 1}, {"key": "31853399", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988174957098591, "res": {"Yes": 0.9988174957098591, "No": 0.001182509267996174}, "ground_truth": 0}, {"key": "31853399", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998751344763485, "res": {"Yes": 0.9998751344763485, "No": 0.00012480088633635985}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.03134461490572635, "res": {"No": 0.9686553270560982, "Yes": 0.03134461490572635}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.7086222762900154, "res": {"Yes": 0.7086222762900154, "No": 0.29137767530862047}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7601523007915172, "res": {"Yes": 0.7601523007915172, "No": 0.2398476617219182}, "ground_truth": 1}, {"key": "35273252", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994131811055954, "res": {"Yes": 0.9994131811055954, "No": 0.0005868114495745883}, "ground_truth": 0}, {"key": "35273252", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8806410947394709, "res": {"Yes": 0.8806410947394709, "No": 0.11935878761014268}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.20223815315753454, "res": {"No": 0.7977618018602209, "Yes": 0.20223815315753454}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.2926174074076843, "res": {"No": 0.7073825785164165, "Yes": 0.2926174074076843}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9956934773779539, "res": {"Yes": 0.9956934773779539, "No": 0.00430643570329396}, "ground_truth": 1}, {"key": "37130459", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998275829655257, "res": {"Yes": 0.9998275829655257, "No": 0.0001723436688392796}, "ground_truth": 0}, {"key": "37130459", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995264250920127, "res": {"Yes": 0.9995264250920127, "No": 0.000473552867018733}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9836694285186319, "res": {"Yes": 0.9836694285186319, "No": 0.01633056946968535}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999740587314805, "res": {"Yes": 0.9999740587314805, "No": 2.582150205882083e-05}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999310282486606, "res": {"Yes": 0.9999310282486606, "No": 6.891518585145421e-05}, "ground_truth": 1}, {"key": "21734003", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 4.2941092901392254e-07}, "ground_truth": 0}, {"key": "21734003", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999596355646657, "res": {"Yes": 0.9999596355646657, "No": 4.028406808720325e-05}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.012977762021781792, "res": {"No": 0.98702213031662, "Yes": 0.012977762021781792}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9706200809618242, "res": {"Yes": 0.9706200809618242, "No": 0.029379812210585755}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998853774396677, "res": {"Yes": 0.9998853774396677, "No": 0.00011456158721137722}, "ground_truth": 1}, {"key": "33990737", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9974442528968954, "res": {"Yes": 0.9974442528968954, "No": 0.00255573097590392}, "ground_truth": 0}, {"key": "33990737", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.019043270393580582, "res": {"No": 0.9809567167007478, "Yes": 0.019043270393580582}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.07376764191220818, "res": {"No": 0.9262322368922449, "Yes": 0.07376764191220818}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998282980724635, "res": {"Yes": 0.9998282980724635, "No": 0.0001715782718239655}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996822231417649, "res": {"Yes": 0.9996822231417649, "No": 0.0003177305059665505}, "ground_truth": 1}, {"key": "34559912", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995155827379468, "res": {"Yes": 0.9995155827379468, "No": 0.00048440220222562306}, "ground_truth": 0}, {"key": "34559912", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.992604372242693, "res": {"Yes": 0.992604372242693, "No": 0.007395618860342901}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.7359906677655652, "res": {"Yes": 0.7359906677655652, "No": 0.2640089961739319}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999877668918251, "res": {"Yes": 0.9999877668918251, "No": 1.2166333134772973e-05}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9833858745480759, "res": {"Yes": 0.9833858745480759, "No": 0.016614109080659276}, "ground_truth": 1}, {"key": "39820439", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999551060207649, "res": {"Yes": 0.9999551060207649, "No": 4.479356801250951e-05}, "ground_truth": 0}, {"key": "39820439", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999495037169802, "res": {"Yes": 0.9999495037169802, "No": 5.041322583254248e-05}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998694134371675, "res": {"Yes": 0.9998694134371675, "No": 0.00013056609295284926}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.7660147757015296, "res": {"Yes": 0.7660147757015296, "No": 0.23398517975745312}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996933056203395, "res": {"Yes": 0.9996933056203395, "No": 0.00030657289516021}, "ground_truth": 1}, {"key": "34759328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 8.741621082001594e-07}, "ground_truth": 0}, {"key": "34759328", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.07194086621422749, "res": {"No": 0.9280591676359607, "Yes": 0.07194086621422749}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9026444194734121, "res": {"Yes": 0.9026444194734121, "No": 0.09735552449315661}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991054950682727, "res": {"Yes": 0.9991054950682727, "No": 0.0008945086364530573}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9984568117414185, "res": {"Yes": 0.9984568117414185, "No": 0.0015431023129344403}, "ground_truth": 1}, {"key": "36939137", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997030736913445, "res": {"Yes": 0.9997030736913445, "No": 0.0002968095116043741}, "ground_truth": 0}, {"key": "36939137", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.003270689369273555, "res": {"No": 0.996729257569909, "Yes": 0.003270689369273555}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.02981764340795252, "res": {"No": 0.9701822990284006, "Yes": 0.02981764340795252}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9972119712910591, "res": {"Yes": 0.9972119712910591, "No": 0.0027880217076863088}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995856210186951, "res": {"Yes": 0.9995856210186951, "No": 0.00041435701528217886}, "ground_truth": 1}, {"key": "35851522", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 2.5407587171163735e-08}, "ground_truth": 0}, {"key": "35851522", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999256644730222, "res": {"Yes": 0.9999256644730222, "No": 7.427939250200152e-05}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9365166811783342, "res": {"Yes": 0.9365166811783342, "No": 0.06348326189720585}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998837087823479, "res": {"Yes": 0.9998837087823479, "No": 0.00011622041970805615}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999820452021894, "res": {"Yes": 0.9999820452021894, "No": 1.7907534712966782e-05}, "ground_truth": 1}, {"key": "22412782", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 7.529183861105073e-07}, "ground_truth": 0}, {"key": "22412782", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999573707926505, "res": {"Yes": 0.9999573707926505, "No": 4.259707368026262e-05}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.003599440004231676, "res": {"No": 0.9964004882302525, "Yes": 0.003599440004231676}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9836401283937481, "res": {"Yes": 0.9836401283937481, "No": 0.01635969485297713}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6643046264078684, "res": {"Yes": 0.6643046264078684, "No": 0.3356952582696954}, "ground_truth": 1}, {"key": "38579227", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7792685388388294, "res": {"Yes": 0.7792685388388294, "No": 0.22073126783901997}, "ground_truth": 0}, {"key": "38579227", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.10958622463548615, "res": {"No": 0.8904136526263898, "Yes": 0.10958622463548615}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.940846405951852, "res": {"Yes": 0.940846405951852, "No": 0.05915354251426736}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9942875229020072, "res": {"Yes": 0.9942875229020072, "No": 0.005712497273777515}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8221745405751785, "res": {"Yes": 0.8221745405751785, "No": 0.17782534824616292}, "ground_truth": 1}, {"key": "37206995", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9349019046595624, "res": {"Yes": 0.9349019046595624, "No": 0.06509805547691346}, "ground_truth": 0}, {"key": "37206995", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.14416719161857916, "res": {"No": 0.8558326707881039, "Yes": 0.14416719161857916}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9845944297968594, "res": {"Yes": 0.9845944297968594, "No": 0.015405504474770612}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.2235339220355453, "res": {"No": 0.776465971715098, "Yes": 0.2235339220355453}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.051314736851425756, "res": {"No": 0.9486850795171129, "Yes": 0.051314736851425756}, "ground_truth": 1}, {"key": "38700847", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7924082759938119, "res": {"Yes": 0.7924082759938119, "No": 0.2075915566002352}, "ground_truth": 0}, {"key": "38700847", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9780094269359115, "res": {"Yes": 0.9780094269359115, "No": 0.021990549194253996}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9371422256018571, "res": {"Yes": 0.9371422256018571, "No": 0.06285770864469824}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9978565611528869, "res": {"Yes": 0.9978565611528869, "No": 0.002143451282927526}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999973031140366, "res": {"Yes": 0.9999973031140366, "No": 2.6311488027967987e-06}, "ground_truth": 1}, {"key": "20246590", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998498667711213, "res": {"Yes": 0.9998498667711213, "No": 0.00015004579656986616}, "ground_truth": 0}, {"key": "20246590", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9741894841617208, "res": {"Yes": 0.9741894841617208, "No": 0.02581038367499588}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9939409162346607, "res": {"Yes": 0.9939409162346607, "No": 0.006059075792621892}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999840716318578, "res": {"Yes": 0.9999840716318578, "No": 1.585886354099392e-05}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990784823883839, "res": {"Yes": 0.9990784823883839, "No": 0.0009214574100415694}, "ground_truth": 1}, {"key": "39141360", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9818273477897418, "res": {"Yes": 0.9818273477897418, "No": 0.01817271473853189}, "ground_truth": 0}, {"key": "39141360", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999846676395419, "res": {"Yes": 0.9999846676395419, "No": 1.5256224107192916e-05}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.004825123252296665, "res": {"No": 0.9951749093311297, "Yes": 0.004825123252296665}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.29933875112054453, "res": {"No": 0.7006612829141713, "Yes": 0.29933875112054453}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.35749650254029486, "res": {"No": 0.6425034195307995, "Yes": 0.35749650254029486}, "ground_truth": 1}, {"key": "37906226", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999224462174501, "res": {"Yes": 0.9999224462174501, "No": 7.749989317445897e-05}, "ground_truth": 0}, {"key": "37906226", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9981061202577705, "res": {"Yes": 0.9981061202577705, "No": 0.0018939103860294616}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 3.448959384848147e-06, "res": {"No": 0.9999964686909351, "Yes": 3.448959384848147e-06}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 7.72033490021296e-08}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 6.575671163534501e-07}, "ground_truth": 1}, {"key": "16201033", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 6.889494698535538e-08}, "ground_truth": 0}, {"key": "16201033", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.0620007732834462e-07}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.002078091613361433, "res": {"No": 0.9979218493513732, "Yes": 0.002078091613361433}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999988005296937, "res": {"Yes": 0.999988005296937, "No": 1.1962545471764405e-05}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998895490961502, "res": {"Yes": 0.9998895490961502, "No": 0.00011031793973578664}, "ground_truth": 1}, {"key": "36469022", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9770005363138964, "res": {"Yes": 0.9770005363138964, "No": 0.022999389658317052}, "ground_truth": 0}, {"key": "36469022", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9963396591398139, "res": {"Yes": 0.9963396591398139, "No": 0.0036603932206638154}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.706526718115057, "res": {"Yes": 0.706526718115057, "No": 0.2934733043701943}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.98566130149827, "res": {"Yes": 0.98566130149827, "No": 0.014338592509323001}, "ground_truth": 1}, {"key": "31295270", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997929049571395, "res": {"Yes": 0.9997929049571395, "No": 0.00020699663931995416}, "ground_truth": 0}, {"key": "31295270", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9027710964528792, "res": {"Yes": 0.9027710964528792, "No": 0.09722887925186173}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8928726655876147, "res": {"Yes": 0.8928726655876147, "No": 0.10712729272066107}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999917005724405, "res": {"Yes": 0.9999917005724405, "No": 8.229732885490531e-06}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999913429644723, "res": {"Yes": 0.9999913429644723, "No": 8.568318948184063e-06}, "ground_truth": 1}, {"key": "35360689", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996815081293073, "res": {"Yes": 0.9996815081293073, "No": 0.0003183950979494406}, "ground_truth": 0}, {"key": "35360689", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8738932765439391, "res": {"Yes": 0.8738932765439391, "No": 0.12610677629308417}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9089176572422139, "res": {"Yes": 0.9089176572422139, "No": 0.0910822804701522}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.459886036011744e-07}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999963494876631, "res": {"Yes": 0.9999963494876631, "No": 3.589347955338039e-06}, "ground_truth": 1}, {"key": "29202793", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999932502087799, "res": {"Yes": 0.9999932502087799, "No": 6.65908813135472e-06}, "ground_truth": 0}, {"key": "29202793", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999976607241361, "res": {"Yes": 0.9999976607241361, "No": 2.2842130298675293e-06}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9784429190533446, "res": {"Yes": 0.9784429190533446, "No": 0.02155707952803364}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 6.911064313022114e-07}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 1.4788366685901649e-08}, "ground_truth": 1}, {"key": "35999008", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999922965856715, "res": {"Yes": 0.9999922965856715, "No": 7.60870934760946e-06}, "ground_truth": 0}, {"key": "35999008", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9996390970411464, "res": {"Yes": 0.9996390970411464, "No": 0.0003608699189089774}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00012222633830991116, "res": {"No": 0.9998776374469079, "Yes": 0.00012222633830991116}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999765736184054, "res": {"Yes": 0.999765736184054, "No": 0.000234161619357963}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.630671185586656e-07}, "ground_truth": 1}, {"key": "31797119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999950382530095, "res": {"Yes": 0.9999950382530095, "No": 4.902280759591527e-06}, "ground_truth": 0}, {"key": "31797119", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.99986464592119, "res": {"Yes": 0.99986464592119, "No": 0.0001352172248140002}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.005538030205626759, "res": {"No": 0.994461967355785, "Yes": 0.005538030205626759}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.10890542869611342, "res": {"No": 0.8910944790853846, "Yes": 0.10890542869611342}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.02871078910086362, "res": {"No": 0.9712888821499126, "Yes": 0.02871078910086362}, "ground_truth": 1}, {"key": "26711893", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.549289227582047, "res": {"Yes": 0.549289227582047, "No": 0.45071059575953926}, "ground_truth": 0}, {"key": "26711893", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9739657502229667, "res": {"Yes": 0.9739657502229667, "No": 0.026034143263878654}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.010753854828374739, "res": {"No": 0.9892460130501842, "Yes": 0.010753854828374739}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.8959736364903189, "res": {"Yes": 0.8959736364903189, "No": 0.10402635484219137}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999924157887603, "res": {"Yes": 0.9999924157887603, "No": 7.543079783432785e-06}, "ground_truth": 1}, {"key": "35348288", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999931310055916, "res": {"Yes": 0.9999931310055916, "No": 6.7506551400800615e-06}, "ground_truth": 0}, {"key": "35348288", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999988005296937, "res": {"Yes": 0.999988005296937, "No": 1.1957988610076927e-05}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.04483645691808112, "res": {"No": 0.9551634417032115, "Yes": 0.04483645691808112}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9991209631794276, "res": {"Yes": 0.9991209631794276, "No": 0.0008790466412227135}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999290019304823, "res": {"Yes": 0.9999290019304823, "No": 7.093631892092655e-05}, "ground_truth": 1}, {"key": "38124131", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998206703614823, "res": {"Yes": 0.9998206703614823, "No": 0.00017931652816117582}, "ground_truth": 0}, {"key": "38124131", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999911045595646, "res": {"Yes": 0.9999911045595646, "No": 8.778737090622174e-06}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0017428945733788646, "res": {"No": 0.9982570816493571, "Yes": 0.0017428945733788646}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.24900039404715174, "res": {"No": 0.7509995548208517, "Yes": 0.24900039404715174}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9880802093271199, "res": {"Yes": 0.9880802093271199, "No": 0.011919646188002666}, "ground_truth": 1}, {"key": "20285901", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995535800050717, "res": {"Yes": 0.9995535800050717, "No": 0.0004464036367897124}, "ground_truth": 0}, {"key": "20285901", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.000244313334184736, "res": {"No": 0.9997556172963189, "Yes": 0.000244313334184736}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9976240882569266, "res": {"Yes": 0.9976240882569266, "No": 0.0023759521893776474}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999421134904887, "res": {"Yes": 0.9999421134904887, "No": 5.7754112440895695e-05}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999790651681366, "res": {"Yes": 0.9999790651681366, "No": 2.081888605106784e-05}, "ground_truth": 1}, {"key": "35633632", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.000936029467135367, "res": {"No": 0.9990639640552105, "Yes": 0.000936029467135367}, "ground_truth": 0}, {"key": "35633632", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9967669207928772, "res": {"Yes": 0.9967669207928772, "No": 0.00323310113059386}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9995489331912348, "res": {"Yes": 0.9995489331912348, "No": 0.00045100248883304706}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.915982247458163, "res": {"Yes": 0.915982247458163, "No": 0.08401770739777949}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7244767853788368, "res": {"Yes": 0.7244767853788368, "No": 0.27552321196001034}, "ground_truth": 1}, {"key": "10741274", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999910407653634, "res": {"Yes": 0.999910407653634, "No": 8.947985874182448e-05}, "ground_truth": 0}, {"key": "10741274", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9368241713431056, "res": {"Yes": 0.9368241713431056, "No": 0.06317574077593831}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.027879754464425213, "res": {"No": 0.9721199993698104, "Yes": 0.027879754464425213}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999630923381045, "res": {"Yes": 0.9999630923381045, "No": 3.6792961303877276e-05}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9888386868435817, "res": {"Yes": 0.9888386868435817, "No": 0.011161226797268116}, "ground_truth": 1}, {"key": "30605795", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999967070975216, "res": {"Yes": 0.9999967070975216, "No": 3.2181464525626138e-06}, "ground_truth": 0}, {"key": "30605795", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9818625106021873, "res": {"Yes": 0.9818625106021873, "No": 0.018137559142345508}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9951815232855553, "res": {"Yes": 0.9951815232855553, "No": 0.0048184759204396915}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9978575091170703, "res": {"Yes": 0.9978575091170703, "No": 0.0021424719494859638}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999961110815618, "res": {"Yes": 0.9999961110815618, "No": 3.7848057250043615e-06}, "ground_truth": 1}, {"key": "30539722", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999940846288958, "res": {"Yes": 0.9999940846288958, "No": 5.893579617478215e-06}, "ground_truth": 0}, {"key": "30539722", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999996945503965, "res": {"Yes": 0.999996945503965, "No": 3.025962001540462e-06}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.021755743224615782, "res": {"No": 0.9782441529111969, "Yes": 0.021755743224615782}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999603507610518, "res": {"Yes": 0.9999603507610518, "No": 3.960674998748861e-05}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9983053109099868, "res": {"Yes": 0.9983053109099868, "No": 0.0016947161759292971}, "ground_truth": 1}, {"key": "18639299", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999673835219289, "res": {"Yes": 0.9999673835219289, "No": 3.2488414795796037e-05}, "ground_truth": 0}, {"key": "18639299", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994547413575521, "res": {"Yes": 0.9994547413575521, "No": 0.0005452121352740158}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9904565515249837, "res": {"Yes": 0.9904565515249837, "No": 0.009543340476904865}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989835452404665, "res": {"Yes": 0.9989835452404665, "No": 0.001016406409965377}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993949648076534, "res": {"Yes": 0.9993949648076534, "No": 0.0006049571069803039}, "ground_truth": 1}, {"key": "39773552", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999860980626328, "res": {"Yes": 0.9999860980626328, "No": 1.3783104878718962e-05}, "ground_truth": 0}, {"key": "39773552", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.994487793868433, "res": {"Yes": 0.994487793868433, "No": 0.005512163958371019}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 2.523400907043283e-06, "res": {"No": 0.9999973031140366, "Yes": 2.523400907043283e-06}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999871708812939, "res": {"Yes": 0.9999871708812939, "No": 1.2772642232049702e-05}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.85094252734951e-07}, "ground_truth": 1}, {"key": "34086410", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 7.131643722361078e-08}, "ground_truth": 0}, {"key": "34086410", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.67231470923038e-07}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.02488243117121991, "res": {"No": 0.9751175228419947, "Yes": 0.02488243117121991}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.0011443753919891284, "res": {"No": 0.9988555561759083, "Yes": 0.0011443753919891284}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9913411139725521, "res": {"Yes": 0.9913411139725521, "No": 0.008658835796753075}, "ground_truth": 1}, {"key": "35454652", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999992773397112, "res": {"Yes": 0.999992773397112, "No": 7.190959110967855e-06}, "ground_truth": 0}, {"key": "35454652", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9935011222485626, "res": {"Yes": 0.9935011222485626, "No": 0.00649885026521939}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.945832003612414e-07, "res": {"No": 0.9999995679800934, "Yes": 1.945832003612414e-07}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999002763027385, "res": {"Yes": 0.9999002763027385, "No": 9.962544042854282e-05}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995523885079278, "res": {"Yes": 0.9995523885079278, "No": 0.00044750108306290106}, "ground_truth": 1}, {"key": "36158310", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999843100330889, "res": {"Yes": 0.9999843100330889, "No": 1.5613853389384378e-05}, "ground_truth": 0}, {"key": "36158310", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999806147848957, "res": {"Yes": 0.9999806147848957, "No": 1.9285597194420647e-05}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 3.720319869295958e-07, "res": {"No": 0.9999993295729247, "Yes": 3.720319869295958e-07}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999744163342675, "res": {"Yes": 0.9999744163342675, "No": 2.5538690019567802e-05}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999641651360841, "res": {"Yes": 0.9999641651360841, "No": 3.572838811060128e-05}, "ground_truth": 1}, {"key": "35688387", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996257621544586, "res": {"Yes": 0.9996257621544586, "No": 0.0003742140118536365}, "ground_truth": 0}, {"key": "35688387", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999782307609533, "res": {"Yes": 0.9999782307609533, "No": 2.1737493006696826e-05}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 6.753330184929646e-08}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 2.12755952083396e-06}, "ground_truth": 1}, {"key": "34209292", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999978991308068, "res": {"Yes": 0.9999978991308068, "No": 2.030003582771634e-06}, "ground_truth": 0}, {"key": "34209292", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999982567412194, "res": {"Yes": 0.9999982567412194, "No": 1.7171647987842632e-06}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.239613401428722e-06, "res": {"No": 0.99999861435166, "Yes": 1.239613401428722e-06}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993623453282058, "res": {"Yes": 0.9993623453282058, "No": 0.0006375505435974993}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999760851449647, "res": {"Yes": 0.9999760851449647, "No": 2.3835416384580886e-05}, "ground_truth": 1}, {"key": "25037859", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998340188763911, "res": {"Yes": 0.9998340188763911, "No": 0.00016588148008518444}, "ground_truth": 0}, {"key": "25037859", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998447454732317, "res": {"Yes": 0.9998447454732317, "No": 0.00015512411802993503}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.32201169957949033, "res": {"No": 0.677987654438701, "Yes": 0.32201169957949033}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.986639727415484, "res": {"Yes": 0.986639727415484, "No": 0.013359845170168963}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998125696772581, "res": {"Yes": 0.9998125696772581, "No": 0.00018725860163246953}, "ground_truth": 1}, {"key": "36412121", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993546093541943, "res": {"Yes": 0.9993546093541943, "No": 0.0006451691677340863}, "ground_truth": 0}, {"key": "36412121", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9971289986296773, "res": {"Yes": 0.9971289986296773, "No": 0.0028706924687598567}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9154720455130609, "res": {"Yes": 0.9154720455130609, "No": 0.0845278680147177}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9877460694449971, "res": {"Yes": 0.9877460694449971, "No": 0.012253826786996687}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9986265447541659, "res": {"Yes": 0.9986265447541659, "No": 0.0013734568074403107}, "ground_truth": 1}, {"key": "34909172", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999775155557789, "res": {"Yes": 0.9999775155557789, "No": 2.2365812335694557e-05}, "ground_truth": 0}, {"key": "34909172", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9985053033733617, "res": {"Yes": 0.9985053033733617, "No": 0.0014946264045364354}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9525488073326029, "res": {"Yes": 0.9525488073326029, "No": 0.047451207804169816}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.892308601881304, "res": {"Yes": 0.892308601881304, "No": 0.10769121148069108}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8167290739087371, "res": {"Yes": 0.8167290739087371, "No": 0.18327075207790966}, "ground_truth": 1}, {"key": "39011806", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9862105644204441, "res": {"Yes": 0.9862105644204441, "No": 0.013789342055866134}, "ground_truth": 0}, {"key": "39011806", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.3024674834549214, "res": {"No": 0.6975324102903858, "Yes": 0.3024674834549214}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.15292153993569188, "res": {"No": 0.847078447970227, "Yes": 0.15292153993569188}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999821644040562, "res": {"Yes": 0.9999821644040562, "No": 1.7762216948665765e-05}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995410766075692, "res": {"Yes": 0.9995410766075692, "No": 0.00045886183788585214}, "ground_truth": 1}, {"key": "33096163", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998267486897419, "res": {"Yes": 0.9998267486897419, "No": 0.00017321672531748548}, "ground_truth": 0}, {"key": "33096163", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9761476278152064, "res": {"Yes": 0.9761476278152064, "No": 0.02385235081114772}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.6584644536799537, "res": {"Yes": 0.6584644536799537, "No": 0.34153517630174424}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998988460004109, "res": {"Yes": 0.9998988460004109, "No": 0.00010093336614364545}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998922904870862, "res": {"Yes": 0.9998922904870862, "No": 0.00010757293234657215}, "ground_truth": 1}, {"key": "38762205", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999856212553752, "res": {"Yes": 0.9999856212553752, "No": 1.4316010952610224e-05}, "ground_truth": 0}, {"key": "38762205", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999953079650794, "res": {"Yes": 0.999953079650794, "No": 4.682421848013968e-05}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0007495369066046461, "res": {"No": 0.9992500948195406, "Yes": 0.0007495369066046461}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999972151525776, "res": {"Yes": 0.999972151525776, "No": 2.7739282738245437e-05}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999791117279034, "res": {"Yes": 0.999791117279034, "No": 0.00020868387727078716}, "ground_truth": 1}, {"key": "35519177", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9988282003939685, "res": {"Yes": 0.9988282003939685, "No": 0.001171494493982179}, "ground_truth": 0}, {"key": "35519177", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9899792942214993, "res": {"Yes": 0.9899792942214993, "No": 0.01002037659199744}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 8.764298360007689e-05, "res": {"No": 0.9999123147445768, "Yes": 8.764298360007689e-05}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.2538342713291983, "res": {"No": 0.7461657040893254, "Yes": 0.2538342713291983}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996921139466417, "res": {"Yes": 0.9996921139466417, "No": 0.00030784627707149326}, "ground_truth": 1}, {"key": "36192531", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999911045595646, "res": {"Yes": 0.9999911045595646, "No": 8.84226051179514e-06}, "ground_truth": 0}, {"key": "36192531", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999803763825457, "res": {"Yes": 0.9999803763825457, "No": 1.958593208890756e-05}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.997590273363929, "res": {"Yes": 0.997590273363929, "No": 0.0024096986037137583}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 4.2760416945794707e-08}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999982567412194, "res": {"Yes": 0.9999982567412194, "No": 1.6987209031776415e-06}, "ground_truth": 1}, {"key": "33160852", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999970647075079, "res": {"Yes": 0.9999970647075079, "No": 2.855790130230084e-06}, "ground_truth": 0}, {"key": "33160852", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.482109023825219, "res": {"No": 0.5178908620211492, "Yes": 0.482109023825219}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.5075581973802206, "res": {"Yes": 0.5075581973802206, "No": 0.4924417004980849}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.997395042505553, "res": {"Yes": 0.997395042505553, "No": 0.0026049565067016683}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9963262858604907, "res": {"Yes": 0.9963262858604907, "No": 0.0036736741019581954}, "ground_truth": 1}, {"key": "36312304", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999899125338788, "res": {"Yes": 0.9999899125338788, "No": 1.0001774807180676e-05}, "ground_truth": 0}, {"key": "36312304", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998070873500388, "res": {"Yes": 0.9998070873500388, "No": 0.00019287273320763352}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9972853613135009, "res": {"Yes": 0.9972853613135009, "No": 0.002714582806050623}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9858378305158284, "res": {"Yes": 0.9858378305158284, "No": 0.014162132525111745}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999970647075079, "res": {"Yes": 0.9999970647075079, "No": 2.906034851332811e-06}, "ground_truth": 1}, {"key": "33773343", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9914453936718592, "res": {"Yes": 0.9914453936718592, "No": 0.008554549776210294}, "ground_truth": 0}, {"key": "33773343", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999944422379444, "res": {"Yes": 0.9999944422379444, "No": 5.478731291269815e-06}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0021972875744377856, "res": {"No": 0.9978026772558504, "Yes": 0.0021972875744377856}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999309090568892, "res": {"Yes": 0.9999309090568892, "No": 6.907283709908085e-05}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.280650254131578e-07}, "ground_truth": 1}, {"key": "34913320", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 4.027934247875536e-07}, "ground_truth": 0}, {"key": "34913320", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.4774665852710063, "res": {"No": 0.522533386278906, "Yes": 0.4774665852710063}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999938462231346, "res": {"Yes": 0.9999938462231346, "No": 6.0832589139621636e-06}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 2.797739427984018e-08}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997825401078307, "res": {"Yes": 0.9997825401078307, "No": 0.0002173566511268445}, "ground_truth": 1}, {"key": "33784155", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 7.259025933953448e-07}, "ground_truth": 0}, {"key": "33784155", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999922965856715, "res": {"Yes": 0.9999922965856715, "No": 7.613588093772374e-06}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9926545224631992, "res": {"Yes": 0.9926545224631992, "No": 0.0073454103718854965}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9631604560844002, "res": {"Yes": 0.9631604560844002, "No": 0.03683951620537765}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999172016779703, "res": {"Yes": 0.9999172016779703, "No": 8.274830725907639e-05}, "ground_truth": 1}, {"key": "24085062", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999766811478886, "res": {"Yes": 0.9999766811478886, "No": 2.32674074161619e-05}, "ground_truth": 0}, {"key": "24085062", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995073763788804, "res": {"Yes": 0.9995073763788804, "No": 0.0004925222109467479}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.4384360758624315e-05, "res": {"No": 0.9999853828508316, "Yes": 1.4384360758624315e-05}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.8411314745624469, "res": {"Yes": 0.8411314745624469, "No": 0.1588684146839298}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9992034360956046, "res": {"Yes": 0.9992034360956046, "No": 0.0007965603201251384}, "ground_truth": 1}, {"key": "33893487", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9980384403776247, "res": {"Yes": 0.9980384403776247, "No": 0.0019615594192751882}, "ground_truth": 0}, {"key": "33893487", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.3410627844584149, "res": {"No": 0.658937229601737, "Yes": 0.3410627844584149}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.03053466143917237, "res": {"No": 0.969465016513986, "Yes": 0.03053466143917237}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 4.1770679705734784e-06, "res": {"No": 0.9999951574563252, "Yes": 4.1770679705734784e-06}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9035362301275831, "res": {"Yes": 0.9035362301275831, "No": 0.0964634595363995}, "ground_truth": 1}, {"key": "40913011", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9918834941577598, "res": {"Yes": 0.9918834941577598, "No": 0.00811650529369158}, "ground_truth": 0}, {"key": "40913011", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.017503192257043578, "res": {"No": 0.9824966037379131, "Yes": 0.017503192257043578}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8513566525732094, "res": {"Yes": 0.8513566525732094, "No": 0.14864335988413785}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.008026224788432698, "res": {"No": 0.9919736941924804, "Yes": 0.008026224788432698}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.00014455449405736107, "res": {"No": 0.9998553493529139, "Yes": 0.00014455449405736107}, "ground_truth": 1}, {"key": "29642545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9974023956281296, "res": {"Yes": 0.9974023956281296, "No": 0.002597642437794093}, "ground_truth": 0}, {"key": "29642545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999379416057018, "res": {"Yes": 0.9999379416057018, "No": 6.197856242804941e-05}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9883646246778821, "res": {"Yes": 0.9883646246778821, "No": 0.011635336049574318}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999641651360841, "res": {"Yes": 0.9999641651360841, "No": 3.580507195041212e-05}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998563028254281, "res": {"Yes": 0.9998563028254281, "No": 0.0001436514038320832}, "ground_truth": 1}, {"key": "35969159", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999828796125555, "res": {"Yes": 0.9999828796125555, "No": 1.7079357284926664e-05}, "ground_truth": 0}, {"key": "35969159", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.00023691029277040184, "res": {"No": 0.9997629951400903, "Yes": 0.00023691029277040184}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 5.16804543458889e-06, "res": {"No": 0.9999946806438478, "Yes": 5.16804543458889e-06}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994003221087031, "res": {"Yes": 0.9994003221087031, "No": 0.000599666434404928}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999877668918251, "res": {"Yes": 0.9999877668918251, "No": 1.2193043180197736e-05}, "ground_truth": 1}, {"key": "37081669", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999983759447187, "res": {"Yes": 0.9999983759447187, "No": 1.5718457377102802e-06}, "ground_truth": 0}, {"key": "37081669", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999766811478886, "res": {"Yes": 0.9999766811478886, "No": 2.330240462332131e-05}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.06074187199704856, "res": {"No": 0.9392579409490477, "Yes": 0.06074187199704856}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999936078174301, "res": {"Yes": 0.9999936078174301, "No": 6.26860322041762e-06}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998509394606263, "res": {"Yes": 0.9998509394606263, "No": 0.0001490344605351841}, "ground_truth": 1}, {"key": "40048022", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9984755912931226, "res": {"Yes": 0.9984755912931226, "No": 0.001524415074812126}, "ground_truth": 0}, {"key": "40048022", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.002020367203861294, "res": {"No": 0.9979796655286942, "Yes": 0.002020367203861294}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00170656790233318, "res": {"No": 0.9982932021389849, "Yes": 0.00170656790233318}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999947998470209, "res": {"Yes": 0.9999947998470209, "No": 5.070384018173844e-06}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999836879295629, "res": {"Yes": 0.999836879295629, "No": 0.00016306559741258362}, "ground_truth": 1}, {"key": "32884004", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.438420544508787e-07}, "ground_truth": 0}, {"key": "32884004", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9995657297826195, "res": {"Yes": 0.9995657297826195, "No": 0.0004342072080056479}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998652418606938, "res": {"Yes": 0.9998652418606938, "No": 0.00013466181453514103}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.4607456988452887e-06}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9957458283344104, "res": {"Yes": 0.9957458283344104, "No": 0.004254215097054052}, "ground_truth": 1}, {"key": "39022490", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9986988246636668, "res": {"Yes": 0.9986988246636668, "No": 0.0013011562327467346}, "ground_truth": 0}, {"key": "39022490", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9907324003857314, "res": {"Yes": 0.9907324003857314, "No": 0.009267593814815607}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9991595189422366, "res": {"Yes": 0.9991595189422366, "No": 0.0008403715016732839}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9978641593606, "res": {"Yes": 0.9978641593606, "No": 0.0021358768799891103}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996226640291312, "res": {"Yes": 0.9996226640291312, "No": 0.00037730336967908693}, "ground_truth": 1}, {"key": "35159385", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999983759447187, "res": {"Yes": 0.9999983759447187, "No": 1.5488404558412024e-06}, "ground_truth": 0}, {"key": "35159385", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9648151503822446, "res": {"Yes": 0.9648151503822446, "No": 0.03518483897845459}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00011302590700480626, "res": {"No": 0.99988680771673, "Yes": 0.00011302590700480626}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9968548098061759, "res": {"Yes": 0.9968548098061759, "No": 0.0031451396059679598}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9687546600034577, "res": {"Yes": 0.9687546600034577, "No": 0.031245278569197926}, "ground_truth": 1}, {"key": "34363669", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997752702855062, "res": {"Yes": 0.9997752702855062, "No": 0.00022462864184332363}, "ground_truth": 0}, {"key": "34363669", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.7373420376106247, "res": {"Yes": 0.7373420376106247, "No": 0.26265778285036456}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.0823758271344067e-05, "res": {"No": 0.9999889589149532, "Yes": 1.0823758271344067e-05}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9819995214004897, "res": {"Yes": 0.9819995214004897, "No": 0.01800036038315512}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9939249054663667, "res": {"Yes": 0.9939249054663667, "No": 0.006075111111280909}, "ground_truth": 1}, {"key": "36119687", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9905765545862727, "res": {"Yes": 0.9905765545862727, "No": 0.009423337064453413}, "ground_truth": 0}, {"key": "36119687", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9829197893274627, "res": {"Yes": 0.9829197893274627, "No": 0.017079991299821077}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.003344900606146238, "res": {"No": 0.9966551206148421, "Yes": 0.003344900606146238}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999976607241361, "res": {"Yes": 0.9999976607241361, "No": 2.240888766569693e-06}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999762043451211, "res": {"Yes": 0.9999762043451211, "No": 2.371787677159329e-05}, "ground_truth": 1}, {"key": "35217446", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999419942923962, "res": {"Yes": 0.9999419942923962, "No": 5.793435492721722e-05}, "ground_truth": 0}, {"key": "35217446", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999199431347219, "res": {"Yes": 0.9999199431347219, "No": 7.995948412629682e-05}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9978147764849105, "res": {"Yes": 0.9978147764849105, "No": 0.0021852267064598084}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9918617949599157, "res": {"Yes": 0.9918617949599157, "No": 0.008138215085320949}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.6991605554935038, "res": {"Yes": 0.6991605554935038, "No": 0.30083943352601383}, "ground_truth": 1}, {"key": "39049331", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5838133811775187, "res": {"Yes": 0.5838133811775187, "No": 0.4161866256373009}, "ground_truth": 0}, {"key": "39049331", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 7.752777381394956e-07, "res": {"No": 0.9999987335551019, "Yes": 7.752777381394956e-07}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999784691637917, "res": {"Yes": 0.9999784691637917, "No": 2.1448132056399207e-05}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.989200397000539, "res": {"Yes": 0.989200397000539, "No": 0.010799519895072846}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9389040858365779, "res": {"Yes": 0.9389040858365779, "No": 0.06109585834273754}, "ground_truth": 1}, {"key": "36472242", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999962302846054, "res": {"Yes": 0.9999962302846054, "No": 3.6499758749297696e-06}, "ground_truth": 0}, {"key": "36472242", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.5263893662857564, "res": {"Yes": 0.5263893662857564, "No": 0.47361062079437216}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.02875081972417568, "res": {"No": 0.9712490649783468, "Yes": 0.02875081972417568}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.3940240406098598e-06}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999576091905158, "res": {"Yes": 0.9999576091905158, "No": 4.231173869038247e-05}, "ground_truth": 1}, {"key": "31854721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.0343287348632409e-07}, "ground_truth": 0}, {"key": "31854721", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999773963544663, "res": {"Yes": 0.9999773963544663, "No": 2.2546380835411676e-05}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 2.735290004952545e-05, "res": {"No": 0.9999725091278809, "Yes": 2.735290004952545e-05}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.4200819169812921e-06}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999943230348141, "res": {"Yes": 0.9999943230348141, "No": 5.553850983067602e-06}, "ground_truth": 1}, {"key": "18725849", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998869269092439, "res": {"Yes": 0.9998869269092439, "No": 0.0001130521885832999}, "ground_truth": 0}, {"key": "18725849", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9994545030375974, "res": {"Yes": 0.9994545030375974, "No": 0.0005454949556163448}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0052147000967345475, "res": {"No": 0.9947852190261032, "Yes": 0.0052147000967345475}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9941608478044985, "res": {"Yes": 0.9941608478044985, "No": 0.005839150237538597}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997918323398948, "res": {"Yes": 0.9997918323398948, "No": 0.00020808976684352296}, "ground_truth": 1}, {"key": "36883179", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999547484278832, "res": {"Yes": 0.9999547484278832, "No": 4.517074116889054e-05}, "ground_truth": 0}, {"key": "36883179", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999959918780326, "res": {"Yes": 0.9999959918780326, "No": 3.944667070513302e-06}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.996509858352799, "res": {"Yes": 0.996509858352799, "No": 0.0034901711634567566}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999579667834204, "res": {"Yes": 0.9999579667834204, "No": 4.196036817695729e-05}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7611780576302423, "res": {"Yes": 0.7611780576302423, "No": 0.23882192224051682}, "ground_truth": 1}, {"key": "34266359", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.78854897262288e-07}, "ground_truth": 0}, {"key": "34266359", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999961110815618, "res": {"Yes": 0.9999961110815618, "No": 3.814808847453319e-06}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9992080740390135, "res": {"Yes": 0.9992080740390135, "No": 0.0007918832409980059}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999965953125608, "res": {"Yes": 0.999965953125608, "No": 3.3929388558684204e-05}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999949190499081, "res": {"Yes": 0.9999949190499081, "No": 4.947263314637916e-06}, "ground_truth": 1}, {"key": "31920289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999931310055916, "res": {"Yes": 0.9999931310055916, "No": 6.811675042407107e-06}, "ground_truth": 0}, {"key": "31920289", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997154636081595, "res": {"Yes": 0.9997154636081595, "No": 0.00028448785336050497}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.20060902789607468, "res": {"No": 0.7993908570785935, "Yes": 0.20060902789607468}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.049864273229319266, "res": {"No": 0.9501355978445025, "Yes": 0.049864273229319266}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9958725537173374, "res": {"Yes": 0.9958725537173374, "No": 0.004127486718428008}, "ground_truth": 1}, {"key": "36292997", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999872900832717, "res": {"Yes": 0.9999872900832717, "No": 1.2585187887612002e-05}, "ground_truth": 0}, {"key": "36292997", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9389222538064135, "res": {"Yes": 0.9389222538064135, "No": 0.061077697243833357}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 2.251621143439462e-05, "res": {"No": 0.9999773963544663, "Yes": 2.251621143439462e-05}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9839298225695999, "res": {"Yes": 0.9839298225695999, "No": 0.0160701783656596}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999975415208221, "res": {"Yes": 0.9999975415208221, "No": 2.3755941104309612e-06}, "ground_truth": 1}, {"key": "30412533", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9978643970518711, "res": {"Yes": 0.9978643970518711, "No": 0.002135568054520882}, "ground_truth": 0}, {"key": "30412533", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.366183015272884e-07}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9657284035950484, "res": {"Yes": 0.9657284035950484, "No": 0.03427133460587356}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999641651360841, "res": {"Yes": 0.9999641651360841, "No": 3.5788963292754215e-05}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9699336062425035, "res": {"Yes": 0.9699336062425035, "No": 0.030066391274750057}, "ground_truth": 1}, {"key": "40433191", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9987498392029135, "res": {"Yes": 0.9987498392029135, "No": 0.0012501191652646926}, "ground_truth": 0}, {"key": "40433191", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9992888939558291, "res": {"Yes": 0.9992888939558291, "No": 0.0007110349309805348}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999735819309633, "res": {"Yes": 0.9999735819309633, "No": 2.634652948500936e-05}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9995658489408572, "res": {"Yes": 0.9995658489408572, "No": 0.00043408464861090067}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999962302846054, "res": {"Yes": 0.9999962302846054, "No": 3.6915357281607014e-06}, "ground_truth": 1}, {"key": "34565591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 2.273289141902195e-08}, "ground_truth": 0}, {"key": "34565591", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.0003894788478628905, "res": {"No": 0.9996105135895327, "Yes": 0.0003894788478628905}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.0205131183021065e-06, "res": {"No": 0.99999861435166, "Yes": 1.0205131183021065e-06}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999987886094374, "res": {"Yes": 0.999987886094374, "No": 1.2086952414625675e-05}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9997782497202287, "res": {"Yes": 0.9997782497202287, "No": 0.00022164157674483894}, "ground_truth": 1}, {"key": "36062480", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9987264113033415, "res": {"Yes": 0.9987264113033415, "No": 0.0012735105236677364}, "ground_truth": 0}, {"key": "36062480", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.6435024143817518, "res": {"Yes": 0.6435024143817518, "No": 0.35649730455924583}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9960734727469776, "res": {"Yes": 0.9960734727469776, "No": 0.0039264875732335685}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.5326235444241817, "res": {"Yes": 0.5326235444241817, "No": 0.4673763300038535}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9719491351340188, "res": {"Yes": 0.9719491351340188, "No": 0.02805074745868549}, "ground_truth": 1}, {"key": "37276883", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990937118274238, "res": {"Yes": 0.9990937118274238, "No": 0.000906196217285541}, "ground_truth": 0}, {"key": "37276883", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.009415575432943643, "res": {"No": 0.9905843930495619, "Yes": 0.009415575432943643}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00031235287489034377, "res": {"No": 0.9996874664287948, "Yes": 0.00031235287489034377}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.5424759371690555, "res": {"Yes": 0.5424759371690555, "No": 0.4575238200220323}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9408487298453446, "res": {"Yes": 0.9408487298453446, "No": 0.059150975306231084}, "ground_truth": 1}, {"key": "38509260", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9084071071229686, "res": {"Yes": 0.9084071071229686, "No": 0.09159260884707805}, "ground_truth": 0}, {"key": "38509260", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.010292142900910739, "res": {"No": 0.9897075050022284, "Yes": 0.010292142900910739}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9009144139069668, "res": {"Yes": 0.9009144139069668, "No": 0.09908541728377764}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.945338868274529, "res": {"Yes": 0.945338868274529, "No": 0.054661098594077875}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9654998774911576, "res": {"Yes": 0.9654998774911576, "No": 0.03450008814570899}, "ground_truth": 1}, {"key": "37139607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994280693147415, "res": {"Yes": 0.9994280693147415, "No": 0.0005719202496463819}, "ground_truth": 0}, {"key": "37139607", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.0014368809809282342, "res": {"No": 0.9985629445544788, "Yes": 0.0014368809809282342}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.008780136717386717, "res": {"No": 0.9912197594390812, "Yes": 0.008780136717386717}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990063873602695, "res": {"Yes": 0.9990063873602695, "No": 0.0009935813669803503}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.45095620528173425, "res": {"No": 0.549043722713421, "Yes": 0.45095620528173425}, "ground_truth": 1}, {"key": "37092824", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9730654197097868, "res": {"Yes": 0.9730654197097868, "No": 0.026934488855305097}, "ground_truth": 0}, {"key": "37092824", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9278091311412501, "res": {"Yes": 0.9278091311412501, "No": 0.0721908624468865}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.017890513118704862, "res": {"No": 0.9821095439158319, "Yes": 0.017890513118704862}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9612455476563061, "res": {"Yes": 0.9612455476563061, "No": 0.03875433726604855}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.4481252991810104, "res": {"No": 0.551874695157531, "Yes": 0.4481252991810104}, "ground_truth": 1}, {"key": "32191802", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.29569046445673103, "res": {"No": 0.7043094779914066, "Yes": 0.29569046445673103}, "ground_truth": 0}, {"key": "32191802", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.7178826380853908, "res": {"Yes": 0.7178826380853908, "No": 0.2821173950971118}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.5314695359309617, "res": {"Yes": 0.5314695359309617, "No": 0.4685302413877543}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999212542766073, "res": {"Yes": 0.9999212542766073, "No": 7.864519687004677e-05}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999714363229496, "res": {"Yes": 0.9999714363229496, "No": 2.8500925429680158e-05}, "ground_truth": 1}, {"key": "39396038", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.419724101424867e-06}, "ground_truth": 0}, {"key": "39396038", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999968263007362, "res": {"Yes": 0.9999968263007362, "No": 3.1042016288652067e-06}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.1004472091520463e-07}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999924157887603, "res": {"Yes": 0.9999924157887603, "No": 7.475249958368361e-06}, "ground_truth": 1}, {"key": "39076884", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998984884226488, "res": {"Yes": 0.9998984884226488, "No": 0.00010147216840391689}, "ground_truth": 0}, {"key": "39076884", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.000263214307549516, "res": {"No": 0.999736672396801, "Yes": 0.000263214307549516}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9978562042196588, "res": {"Yes": 0.9978562042196588, "No": 0.0021437363809067504}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999359152835132, "res": {"Yes": 0.9999359152835132, "No": 6.397417958464157e-05}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9986915700418837, "res": {"Yes": 0.9986915700418837, "No": 0.0013083637084967032}, "ground_truth": 1}, {"key": "27763432", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.5744721556326062, "res": {"Yes": 0.5744721556326062, "No": 0.42552782051164145}, "ground_truth": 0}, {"key": "27763432", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988502019249353, "res": {"Yes": 0.9988502019249353, "No": 0.001149724420122548}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.18214460033938126, "res": {"No": 0.8178552451159063, "Yes": 0.18214460033938126}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9474569172312292, "res": {"Yes": 0.9474569172312292, "No": 0.052542926282326485}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.5423888713440352, "res": {"Yes": 0.5423888713440352, "No": 0.4576109545793326}, "ground_truth": 1}, {"key": "37806929", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9867296824732867, "res": {"Yes": 0.9867296824732867, "No": 0.01327029102275768}, "ground_truth": 0}, {"key": "37806929", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.19390108908769021, "res": {"No": 0.8060987382066778, "Yes": 0.19390108908769021}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.17358022405131354, "res": {"No": 0.8264196943191002, "Yes": 0.17358022405131354}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999877668918251, "res": {"Yes": 0.9999877668918251, "No": 1.2117231833324108e-05}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999965878943212, "res": {"Yes": 0.9999965878943212, "No": 3.2784001949394933e-06}, "ground_truth": 1}, {"key": "32334186", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 6.488320087829676e-07}, "ground_truth": 0}, {"key": "32334186", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9986436645554916, "res": {"Yes": 0.9986436645554916, "No": 0.0013563554398895834}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.017263731900212954, "res": {"No": 0.9827361253191282, "Yes": 0.017263731900212954}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.994282215111091, "res": {"Yes": 0.994282215111091, "No": 0.005717720883111564}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8869859559497408, "res": {"Yes": 0.8869859559497408, "No": 0.11301392926893207}, "ground_truth": 1}, {"key": "36187324", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999783499623655, "res": {"Yes": 0.9999783499623655, "No": 2.1530522035368464e-05}, "ground_truth": 0}, {"key": "36187324", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9938849817956438, "res": {"Yes": 0.9938849817956438, "No": 0.006114972542751598}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.4933646614347664, "res": {"No": 0.5066351954411416, "Yes": 0.4933646614347664}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9968697350274908, "res": {"Yes": 0.9968697350274908, "No": 0.0031302481388015358}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.996462627296465, "res": {"Yes": 0.996462627296465, "No": 0.0035373585594729094}, "ground_truth": 1}, {"key": "35306009", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9595593848458712, "res": {"Yes": 0.9595593848458712, "No": 0.04044024607126844}, "ground_truth": 0}, {"key": "35306009", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.25884884440149913, "res": {"No": 0.7411509375718471, "Yes": 0.25884884440149913}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.4499695525407733e-06}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999980183344636, "res": {"Yes": 0.9999980183344636, "No": 1.8781731167192466e-06}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 8.349174326823101e-07}, "ground_truth": 1}, {"key": "39490050", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999942038320978, "res": {"Yes": 0.9999942038320978, "No": 5.7415692298751285e-06}, "ground_truth": 0}, {"key": "39490050", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9989471433429107, "res": {"Yes": 0.9989471433429107, "No": 0.0010528452686287934}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9987597061010635, "res": {"Yes": 0.9987597061010635, "No": 0.0012402746896335044}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993727057913305, "res": {"Yes": 0.9993727057913305, "No": 0.0006271919022279647}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998572563188488, "res": {"Yes": 0.9998572563188488, "No": 0.00014268545011962065}, "ground_truth": 1}, {"key": "38072149", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999845484373766, "res": {"Yes": 0.9999845484373766, "No": 1.5356772131771345e-05}, "ground_truth": 0}, {"key": "38072149", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9892006334194621, "res": {"Yes": 0.9892006334194621, "No": 0.010799321185734907}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9822865261792882, "res": {"Yes": 0.9822865261792882, "No": 0.017713491466608954}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.22887002797063682, "res": {"No": 0.7711299132018334, "Yes": 0.22887002797063682}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996703102896007, "res": {"Yes": 0.9996703102896007, "No": 0.00032956531469775845}, "ground_truth": 1}, {"key": "35899689", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9940349119064945, "res": {"Yes": 0.9940349119064945, "No": 0.005965019227804406}, "ground_truth": 0}, {"key": "35899689", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.2562724609200082, "res": {"No": 0.7437274811693717, "Yes": 0.2562724609200082}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999785883642324, "res": {"Yes": 0.9999785883642324, "No": 2.137415662628705e-05}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999851444463448, "res": {"Yes": 0.9999851444463448, "No": 1.4736664291031202e-05}, "ground_truth": 1}, {"key": "27994518", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999883629027115, "res": {"Yes": 0.9999883629027115, "No": 1.1617848251251757e-05}, "ground_truth": 0}, {"key": "27994518", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997715758127782, "res": {"Yes": 0.9997715758127782, "No": 0.00022836107943017677}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 2.3164329130365544e-05, "res": {"No": 0.9999768003491161, "Yes": 2.3164329130365544e-05}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9970765015687378, "res": {"Yes": 0.9970765015687378, "No": 0.0029235314288129175}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9853437341551761, "res": {"Yes": 0.9853437341551761, "No": 0.014656212089248692}, "ground_truth": 1}, {"key": "10615479", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9966763249770935, "res": {"Yes": 0.9966763249770935, "No": 0.003323716481503174}, "ground_truth": 0}, {"key": "10615479", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9946842468855456, "res": {"Yes": 0.9946842468855456, "No": 0.005315732814619807}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9551357118007012, "res": {"Yes": 0.9551357118007012, "No": 0.04486425068144137}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9498843905032468, "res": {"Yes": 0.9498843905032468, "No": 0.0501155469834185}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999610659559496, "res": {"Yes": 0.9999610659559496, "No": 3.880253416255363e-05}, "ground_truth": 1}, {"key": "40186667", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9995435714452191, "res": {"Yes": 0.9995435714452191, "No": 0.0004563634620678411}, "ground_truth": 0}, {"key": "40186667", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9971693064895807, "res": {"Yes": 0.9971693064895807, "No": 0.0028306927763164283}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.7025500041659725, "res": {"Yes": 0.7025500041659725, "No": 0.29745004025933147}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9969905840976011, "res": {"Yes": 0.9969905840976011, "No": 0.0030094546380774944}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.3579571999605597e-07}, "ground_truth": 1}, {"key": "38622886", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999801379802525, "res": {"Yes": 0.9999801379802525, "No": 1.980690388457004e-05}, "ground_truth": 0}, {"key": "38622886", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.7642517290708508e-07}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0030525315995807217, "res": {"No": 0.9969474569126281, "Yes": 0.0030525315995807217}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.0011550726922220978, "res": {"No": 0.9988448511986203, "Yes": 0.0011550726922220978}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999951574563252, "res": {"Yes": 0.9999951574563252, "No": 4.813014283288404e-06}, "ground_truth": 1}, {"key": "40686943", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999355576904948, "res": {"Yes": 0.9999355576904948, "No": 6.442569588561836e-05}, "ground_truth": 0}, {"key": "40686943", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999985978860297, "res": {"Yes": 0.999985978860297, "No": 1.3974141107844963e-05}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.02696389581106113, "res": {"No": 0.9730359635192525, "Yes": 0.02696389581106113}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.1129730369278451, "res": {"No": 0.8870269445177988, "Yes": 0.1129730369278451}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.04262261917799964, "res": {"No": 0.9573773596952173, "Yes": 0.04262261917799964}, "ground_truth": 1}, {"key": "30604567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.7635960194632588, "res": {"Yes": 0.7635960194632588, "No": 0.23640397000496077}, "ground_truth": 0}, {"key": "30604567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.539281786333959, "res": {"Yes": 0.539281786333959, "No": 0.4607182012529869}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9997985063825662, "res": {"Yes": 0.9997985063825662, "No": 0.00020143979607599273}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9951359599425784, "res": {"Yes": 0.9951359599425784, "No": 0.004864054157625574}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.99999861435166, "res": {"Yes": 0.99999861435166, "No": 1.3046340212602227e-06}, "ground_truth": 1}, {"key": "35440903", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999829988145218, "res": {"Yes": 0.9999829988145218, "No": 1.6963509855235203e-05}, "ground_truth": 0}, {"key": "35440903", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9938951086407034, "res": {"Yes": 0.9938951086407034, "No": 0.006104848423397585}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 3.678159403516779e-05, "res": {"No": 0.9999630923381045, "Yes": 3.678159403516779e-05}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998184059102031, "res": {"Yes": 0.9998184059102031, "No": 0.00018147076347807816}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.37710417629921766, "res": {"No": 0.6228958183131934, "Yes": 0.37710417629921766}, "ground_truth": 1}, {"key": "37219533", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6154500008775284, "res": {"Yes": 0.6154500008775284, "No": 0.38455007670968566}, "ground_truth": 0}, {"key": "37219533", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8115879080864142, "res": {"Yes": 0.8115879080864142, "No": 0.18841204231748165}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.6878656199268284, "res": {"Yes": 0.6878656199268284, "No": 0.3121339363859696}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9897119369223588, "res": {"Yes": 0.9897119369223588, "No": 0.010287912670547603}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999249493064443, "res": {"Yes": 0.9999249493064443, "No": 7.503146493053088e-05}, "ground_truth": 1}, {"key": "40178965", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.998600623641501, "res": {"Yes": 0.998600623641501, "No": 0.0013992862413141085}, "ground_truth": 0}, {"key": "40178965", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9967537721284431, "res": {"Yes": 0.9967537721284431, "No": 0.0032462318047785676}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.3739498804648301, "res": {"No": 0.6260499617277995, "Yes": 0.3739498804648301}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9960557318403466, "res": {"Yes": 0.9960557318403466, "No": 0.003944267578877929}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999846676395419, "res": {"Yes": 0.9999846676395419, "No": 1.5227965271733172e-05}, "ground_truth": 1}, {"key": "13750468", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.371040497680644e-07}, "ground_truth": 0}, {"key": "13750468", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9856669749810497, "res": {"Yes": 0.9856669749810497, "No": 0.014332932750310256}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.004651646667622214, "res": {"No": 0.9953482610078115, "Yes": 0.004651646667622214}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999211350800014, "res": {"Yes": 0.9999211350800014, "No": 7.878089813032638e-05}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996543460520952, "res": {"Yes": 0.9996543460520952, "No": 0.0003456091657910222}, "ground_truth": 1}, {"key": "17754949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997701457005481, "res": {"Yes": 0.9997701457005481, "No": 0.00022975546736342037}, "ground_truth": 0}, {"key": "17754949", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993869940049946, "res": {"Yes": 0.9993869940049946, "No": 0.0006129172027953678}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8242159896989099, "res": {"Yes": 0.8242159896989099, "No": 0.17578319322134991}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.8841999801850731, "res": {"Yes": 0.8841999801850731, "No": 0.11579966578352972}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.2998509083572562, "res": {"No": 0.7001486145307936, "Yes": 0.2998509083572562}, "ground_truth": 1}, {"key": "36675623", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.0018677365169638125, "res": {"No": 0.9981320101687658, "Yes": 0.0018677365169638125}, "ground_truth": 0}, {"key": "36675623", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.0020237468692053747, "res": {"No": 0.9979762231035731, "Yes": 0.0020237468692053747}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9942416775601516, "res": {"Yes": 0.9942416775601516, "No": 0.005758242340848853}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.015532967162905618, "res": {"No": 0.9844669832816065, "Yes": 0.015532967162905618}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.18942380874111914, "res": {"No": 0.8105759618415252, "Yes": 0.18942380874111914}, "ground_truth": 1}, {"key": "40035440", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9926148200542582, "res": {"Yes": 0.9926148200542582, "No": 0.0073851245342961}, "ground_truth": 0}, {"key": "40035440", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8580474053755515, "res": {"Yes": 0.8580474053755515, "No": 0.14195238422118783}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.5055480958215688, "res": {"Yes": 0.5055480958215688, "No": 0.49445160462444526}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.0718479642637828, "res": {"No": 0.9281519967562146, "Yes": 0.0718479642637828}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999948788531352, "res": {"Yes": 0.999948788531352, "No": 5.118930164492158e-05}, "ground_truth": 1}, {"key": "37685909", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999018257994022, "res": {"Yes": 0.9999018257994022, "No": 9.815742407604791e-05}, "ground_truth": 0}, {"key": "37685909", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999269008604483, "res": {"Yes": 0.999269008604483, "No": 0.0007309123570491743}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.12894870362765076, "res": {"No": 0.871051192029229, "Yes": 0.12894870362765076}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999962302846054, "res": {"Yes": 0.9999962302846054, "No": 3.6445341714446364e-06}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.497875033950218e-07}, "ground_truth": 1}, {"key": "36938787", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.476184782699463e-07}, "ground_truth": 0}, {"key": "36938787", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.7014343846183462e-07}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9775151417121305, "res": {"Yes": 0.9775151417121305, "No": 0.02248478546623006}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999944422379444, "res": {"Yes": 0.9999944422379444, "No": 5.446845087141133e-06}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999994561441089, "res": {"Yes": 0.999994561441089, "No": 5.347774847118683e-06}, "ground_truth": 1}, {"key": "39398068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999953958625991, "res": {"Yes": 0.9999953958625991, "No": 4.555514868230986e-06}, "ground_truth": 0}, {"key": "39398068", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.04110324117021945, "res": {"No": 0.9588966484801539, "Yes": 0.04110324117021945}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.23339016452810676, "res": {"No": 0.7666096791800587, "Yes": 0.23339016452810676}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999996945503965, "res": {"Yes": 0.999996945503965, "No": 2.9976077621961295e-06}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999727475263555, "res": {"Yes": 0.9999727475263555, "No": 2.7232021937381212e-05}, "ground_truth": 1}, {"key": "39926408", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.299180260569143e-07}, "ground_truth": 0}, {"key": "39926408", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999962734742367, "res": {"Yes": 0.999962734742367, "No": 3.720095964906629e-05}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9967059283979288, "res": {"Yes": 0.9967059283979288, "No": 0.003294114129941843}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9914636780764092, "res": {"Yes": 0.9914636780764092, "No": 0.00853621993272547}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9639939021135007, "res": {"Yes": 0.9639939021135007, "No": 0.03600600676000855}, "ground_truth": 1}, {"key": "40465336", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9933052430096465, "res": {"Yes": 0.9933052430096465, "No": 0.006694677307699084}, "ground_truth": 0}, {"key": "40465336", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.6107029183914595, "res": {"Yes": 0.6107029183914595, "No": 0.38929712867616645}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.018322649625155743, "res": {"No": 0.981677400822896, "Yes": 0.018322649625155743}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998483173649743, "res": {"Yes": 0.9998483173649743, "No": 0.00015163882742035294}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998545150339643, "res": {"Yes": 0.9998545150339643, "No": 0.00014544769798442158}, "ground_truth": 1}, {"key": "34173549", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999976607241361, "res": {"Yes": 0.9999976607241361, "No": 2.22318656861805e-06}, "ground_truth": 0}, {"key": "34173549", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999565364005696, "res": {"Yes": 0.9999565364005696, "No": 4.3382171334633336e-05}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 2.195027462776321e-06, "res": {"No": 0.9999976607241361, "Yes": 2.195027462776321e-06}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9934529922590564, "res": {"Yes": 0.9934529922590564, "No": 0.006547008835334238}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7051294894901652, "res": {"Yes": 0.7051294894901652, "No": 0.29487047112464015}, "ground_truth": 1}, {"key": "33541535", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999484309397297, "res": {"Yes": 0.9999484309397297, "No": 5.1500708145039635e-05}, "ground_truth": 0}, {"key": "33541535", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9922035477317327, "res": {"Yes": 0.9922035477317327, "No": 0.007796448262124687}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.001298135467257516, "res": {"No": 0.9987016782498952, "Yes": 0.001298135467257516}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9877751461540067, "res": {"Yes": 0.9877751461540067, "No": 0.012224636233681392}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9271321471650238, "res": {"Yes": 0.9271321471650238, "No": 0.07286778094553535}, "ground_truth": 1}, {"key": "35685195", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9019306433040296, "res": {"Yes": 0.9019306433040296, "No": 0.09806919284582706}, "ground_truth": 0}, {"key": "35685195", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9836876432940808, "res": {"Yes": 0.9836876432940808, "No": 0.016312372663478104}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0007648276833754866, "res": {"No": 0.999234978478295, "Yes": 0.0007648276833754866}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997233288405262, "res": {"Yes": 0.9997233288405262, "No": 0.00027661580502525356}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9931738815155872, "res": {"Yes": 0.9931738815155872, "No": 0.006826153098641645}, "ground_truth": 1}, {"key": "28440730", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999943230348141, "res": {"Yes": 0.9999943230348141, "No": 5.558662701192173e-06}, "ground_truth": 0}, {"key": "28440730", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9913293973811653, "res": {"Yes": 0.9913293973811653, "No": 0.008670565200026565}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.30336566072477417, "res": {"No": 0.6966342882274389, "Yes": 0.30336566072477417}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9874377299239296, "res": {"Yes": 0.9874377299239296, "No": 0.012562189624192425}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.998265872938883, "res": {"Yes": 0.998265872938883, "No": 0.0017340891309723205}, "ground_truth": 1}, {"key": "38338714", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8315318390348821, "res": {"Yes": 0.8315318390348821, "No": 0.1684680771927835}, "ground_truth": 0}, {"key": "38338714", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9617525037748644, "res": {"Yes": 0.9617525037748644, "No": 0.03824738832980702}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00010362095295375619, "res": {"No": 0.999896223785124, "Yes": 0.00010362095295375619}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999858596579756, "res": {"Yes": 0.9999858596579756, "No": 1.4049032861980708e-05}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999386567915716, "res": {"Yes": 0.9999386567915716, "No": 6.121593662350174e-05}, "ground_truth": 1}, {"key": "32191881", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9934990011259309, "res": {"Yes": 0.9934990011259309, "No": 0.006500969235779288}, "ground_truth": 0}, {"key": "32191881", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998843047282142, "res": {"Yes": 0.9998843047282142, "No": 0.00011560018515967364}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00021038066031088505, "res": {"No": 0.9997894487690223, "Yes": 0.00021038066031088505}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.5311475629598511, "res": {"Yes": 0.5311475629598511, "No": 0.46885231664819577}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996529160975587, "res": {"Yes": 0.9996529160975587, "No": 0.00034705926503248146}, "ground_truth": 1}, {"key": "37707251", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9992852011904735, "res": {"Yes": 0.9992852011904735, "No": 0.0007147144254633719}, "ground_truth": 0}, {"key": "37707251", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999976607241361, "res": {"Yes": 0.9999976607241361, "No": 2.261299296323039e-06}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00037952541259911836, "res": {"No": 0.9996202808615674, "Yes": 0.00037952541259911836}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.6268320356266095, "res": {"Yes": 0.6268320356266095, "No": 0.3731679472318652}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9991678489299031, "res": {"Yes": 0.9991678489299031, "No": 0.0008321384705846506}, "ground_truth": 1}, {"key": "40172567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999992773397112, "res": {"Yes": 0.999992773397112, "No": 7.179886376710786e-06}, "ground_truth": 0}, {"key": "40172567", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999680987188567, "res": {"Yes": 0.9999680987188567, "No": 3.184898642001155e-05}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.4781547280597917, "res": {"No": 0.5218452192058836, "Yes": 0.4781547280597917}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999466429775365, "res": {"Yes": 0.9999466429775365, "No": 5.331755067695694e-05}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 8.27117559724974e-07}, "ground_truth": 1}, {"key": "33113255", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997213029432419, "res": {"Yes": 0.9997213029432419, "No": 0.0002786477830551326}, "ground_truth": 0}, {"key": "33113255", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9928157132610264, "res": {"Yes": 0.9928157132610264, "No": 0.007184306389637804}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.2646967097330313, "res": {"No": 0.7353030439865056, "Yes": 0.2646967097330313}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998136422967544, "res": {"Yes": 0.9998136422967544, "No": 0.0001863404837284593}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999648803297101, "res": {"Yes": 0.9999648803297101, "No": 3.500477770268249e-05}, "ground_truth": 1}, {"key": "33022143", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999607083559369, "res": {"Yes": 0.9999607083559369, "No": 3.9266964129084985e-05}, "ground_truth": 0}, {"key": "33022143", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998633348695298, "res": {"Yes": 0.9998633348695298, "No": 0.00013660226905789352}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9216379421687503, "res": {"Yes": 0.9216379421687503, "No": 0.07836140938825277}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9721127959873037, "res": {"Yes": 0.9721127959873037, "No": 0.027886992988203917}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999978991308068, "res": {"Yes": 0.9999978991308068, "No": 1.9912141094801884e-06}, "ground_truth": 1}, {"key": "32084473", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999638075349631, "res": {"Yes": 0.9999638075349631, "No": 3.6000778310707205e-05}, "ground_truth": 0}, {"key": "32084473", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999640459343629, "res": {"Yes": 0.9999640459343629, "No": 3.58815615593395e-05}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0025329126331760025, "res": {"No": 0.9974670269038102, "Yes": 0.0025329126331760025}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.6718289564159224, "res": {"Yes": 0.6718289564159224, "No": 0.3281710213264638}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9872071797648853, "res": {"Yes": 0.9872071797648853, "No": 0.012792804686247095}, "ground_truth": 1}, {"key": "40564245", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993581831526028, "res": {"Yes": 0.9993581831526028, "No": 0.0006418014307589653}, "ground_truth": 0}, {"key": "40564245", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.8063086494612555, "res": {"Yes": 0.8063086494612555, "No": 0.19369132409415604}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.1736880334784001, "res": {"No": 0.8263119114275842, "Yes": 0.1736880334784001}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.5896249041138408, "res": {"Yes": 0.5896249041138408, "No": 0.410374960259443}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9993432997220758, "res": {"Yes": 0.9993432997220758, "No": 0.00065667804344978}, "ground_truth": 1}, {"key": "31717213", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998360449920916, "res": {"Yes": 0.9998360449920916, "No": 0.00016387673968663643}, "ground_truth": 0}, {"key": "31717213", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999877668918251, "res": {"Yes": 0.9999877668918251, "No": 1.220565730722587e-05}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.03654893249193063, "res": {"No": 0.9634509476597382, "Yes": 0.03654893249193063}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999870516788303, "res": {"Yes": 0.9999870516788303, "No": 1.2910082018855414e-05}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8103704258406688, "res": {"Yes": 0.8103704258406688, "No": 0.1896295020000027}, "ground_truth": 1}, {"key": "34861894", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9990702685683412, "res": {"Yes": 0.9990702685683412, "No": 0.000929722224281568}, "ground_truth": 0}, {"key": "34861894", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.03473644691090858, "res": {"No": 0.9652634555222117, "Yes": 0.03473644691090858}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998932440088264, "res": {"Yes": 0.9998932440088264, "No": 0.00010665491806984625}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999686947220204, "res": {"Yes": 0.9999686947220204, "No": 3.1171385979460304e-05}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9987514987270251, "res": {"Yes": 0.9987514987270251, "No": 0.001248453117513456}, "ground_truth": 1}, {"key": "40838760", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9996542268933043, "res": {"Yes": 0.9996542268933043, "No": 0.00034566851197951275}, "ground_truth": 0}, {"key": "40838760", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999678603234905, "res": {"Yes": 0.9999678603234905, "No": 3.21042865294677e-05}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0005199288409914715, "res": {"No": 0.9994798689150959, "Yes": 0.0005199288409914715}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999888397127765, "res": {"Yes": 0.9999888397127765, "No": 1.1060017274296632e-05}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9933941714501072, "res": {"Yes": 0.9933941714501072, "No": 0.006605775082830451}, "ground_truth": 1}, {"key": "40044849", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999949190499081, "res": {"Yes": 0.9999949190499081, "No": 5.003479437738207e-06}, "ground_truth": 0}, {"key": "40044849", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999983475621529, "res": {"Yes": 0.999983475621529, "No": 1.6466344292643082e-05}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9874770055469975, "res": {"Yes": 0.9874770055469975, "No": 0.01252288510701427}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999919389784903, "res": {"Yes": 0.9999919389784903, "No": 8.030514177406211e-06}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998865693437434, "res": {"Yes": 0.9998865693437434, "No": 0.00011339298831722876}, "ground_truth": 1}, {"key": "30296116", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999906277489198, "res": {"Yes": 0.9999906277489198, "No": 9.249186095379154e-06}, "ground_truth": 0}, {"key": "30296116", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.30967980574174364, "res": {"No": 0.6903201524103058, "Yes": 0.30967980574174364}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.5924168993920633, "res": {"Yes": 0.5924168993920633, "No": 0.4075829128016124}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9974276581559294, "res": {"Yes": 0.9974276581559294, "No": 0.0025723253081154454}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999921773835968, "res": {"Yes": 0.9999921773835968, "No": 7.762244701043375e-06}, "ground_truth": 1}, {"key": "34931360", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999908262182171, "res": {"Yes": 0.999908262182171, "No": 9.161111049739365e-05}, "ground_truth": 0}, {"key": "34931360", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999940846288958, "res": {"Yes": 0.9999940846288958, "No": 5.7869105068930635e-06}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.012832516214256604, "res": {"No": 0.9871674365910507, "Yes": 0.012832516214256604}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999984951481323, "res": {"Yes": 0.9999984951481323, "No": 1.4664295342106465e-06}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 6.490131185229847e-08}, "ground_truth": 1}, {"key": "18862422", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999974223173222, "res": {"Yes": 0.9999974223173222, "No": 2.489011286592271e-06}, "ground_truth": 0}, {"key": "18862422", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999944422379444, "res": {"Yes": 0.9999944422379444, "No": 5.504748360033476e-06}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998965813680755, "res": {"Yes": 0.9998965813680755, "No": 0.00010339044585644829}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9984204435145674, "res": {"Yes": 0.9984204435145674, "No": 0.0015793855499788162}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999940846288958, "res": {"Yes": 0.9999940846288958, "No": 5.828761592368718e-06}, "ground_truth": 1}, {"key": "36361140", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999717939237989, "res": {"Yes": 0.9999717939237989, "No": 2.811669584167125e-05}, "ground_truth": 0}, {"key": "36361140", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.4847830537374519, "res": {"No": 0.5152168494752376, "Yes": 0.4847830537374519}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.5365443579966233, "res": {"Yes": 0.5365443579966233, "No": 0.46345562384243555}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 7.81684992848679e-07}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995716873820494, "res": {"Yes": 0.9995716873820494, "No": 0.00042826003005794465}, "ground_truth": 1}, {"key": "39703329", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 6.567832286923296e-09}, "ground_truth": 0}, {"key": "39703329", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.988988959221099, "res": {"Yes": 0.988988959221099, "No": 0.011010968132567984}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999858596579756, "res": {"Yes": 0.9999858596579756, "No": 1.4064045244262487e-05}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.0012081536425690557, "res": {"No": 0.9987918077526641, "Yes": 0.0012081536425690557}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9962103295945242, "res": {"Yes": 0.9962103295945242, "No": 0.0037896307199664064}, "ground_truth": 1}, {"key": "34033324", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999947998470209, "res": {"Yes": 0.9999947998470209, "No": 5.14371488127494e-06}, "ground_truth": 0}, {"key": "34033324", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.047872655689567695, "res": {"No": 0.9521272511015012, "Yes": 0.047872655689567695}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.18760252181306797, "res": {"No": 0.8123971560167252, "Yes": 0.18760252181306797}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.7263754638536839, "res": {"Yes": 0.7263754638536839, "No": 0.2736244043570873}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999989719621284, "res": {"Yes": 0.9999989719621284, "No": 9.579598213411512e-07}, "ground_truth": 1}, {"key": "35658862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.628495557000144e-07}, "ground_truth": 0}, {"key": "35658862", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9993965135712305, "res": {"Yes": 0.9993965135712305, "No": 0.0006034297068610487}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.13018685687025422, "res": {"No": 0.8698127155413603, "Yes": 0.13018685687025422}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9997079596120984, "res": {"Yes": 0.9997079596120984, "No": 0.0002918962870860312}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999419942923962, "res": {"Yes": 0.9999419942923962, "No": 5.796843034510552e-05}, "ground_truth": 1}, {"key": "36092657", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997310713178026, "res": {"Yes": 0.9997310713178026, "No": 0.00026891747763996504}, "ground_truth": 0}, {"key": "36092657", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9989372672009041, "res": {"Yes": 0.9989372672009041, "No": 0.001062489754537956}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998814441782969, "res": {"Yes": 0.9998814441782969, "No": 0.00011848170470306418}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9990339788990975, "res": {"Yes": 0.9990339788990975, "No": 0.000965971139975313}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 5.010469638677e-07}, "ground_truth": 1}, {"key": "26333438", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999841908319662, "res": {"Yes": 0.9999841908319662, "No": 1.5673204867703826e-05}, "ground_truth": 0}, {"key": "26333438", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999970647075079, "res": {"Yes": 0.9999970647075079, "No": 2.870228254989407e-06}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.05690082151958703, "res": {"No": 0.9430989224450158, "Yes": 0.05690082151958703}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9590798487996756, "res": {"Yes": 0.9590798487996756, "No": 0.04091989515894958}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999987335551019, "res": {"Yes": 0.9999987335551019, "No": 1.15830248456556e-06}, "ground_truth": 1}, {"key": "34184963", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999889589149532, "res": {"Yes": 0.9999889589149532, "No": 1.0932702839762386e-05}, "ground_truth": 0}, {"key": "34184963", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999972151525776, "res": {"Yes": 0.999972151525776, "No": 2.7796901508727928e-05}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.7579741324329315, "res": {"Yes": 0.7579741324329315, "No": 0.24202569034728638}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999785883642324, "res": {"Yes": 0.9999785883642324, "No": 2.1322195191777614e-05}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.999296513912449, "res": {"Yes": 0.999296513912449, "No": 0.0007033921486398361}, "ground_truth": 1}, {"key": "35069975", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994304483561492, "res": {"Yes": 0.9994304483561492, "No": 0.0005694552248666167}, "ground_truth": 0}, {"key": "35069975", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.6832328876536552, "res": {"Yes": 0.6832328876536552, "No": 0.31676706054503095}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.005611237474964034, "res": {"No": 0.9943887671078808, "Yes": 0.005611237474964034}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.011571938574462395, "res": {"No": 0.9884278504083838, "Yes": 0.011571938574462395}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999995679800934, "res": {"Yes": 0.9999995679800934, "No": 3.6398433716571375e-07}, "ground_truth": 1}, {"key": "36443950", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9994591458143839, "res": {"Yes": 0.9994591458143839, "No": 0.0005407590268859888}, "ground_truth": 0}, {"key": "36443950", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 1.7169570344136081e-06, "res": {"No": 0.9999974223173222, "Yes": 1.7169570344136081e-06}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.14764011823316223, "res": {"No": 0.8523598518465635, "Yes": 0.14764011823316223}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.992389353256952, "res": {"Yes": 0.992389353256952, "No": 0.007610617250127355}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999992103693117, "res": {"Yes": 0.9999992103693117, "No": 6.645950029086111e-07}, "ground_truth": 1}, {"key": "29460858", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9981828402376601, "res": {"Yes": 0.9981828402376601, "No": 0.0018171517068781258}, "ground_truth": 0}, {"key": "29460858", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.6179918372160169, "res": {"Yes": 0.6179918372160169, "No": 0.3820081444702859}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.7093881081739453, "res": {"Yes": 0.7093881081739453, "No": 0.2906118938754281}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999953958625991, "res": {"Yes": 0.9999953958625991, "No": 4.580048364314225e-06}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998455797840291, "res": {"Yes": 0.9998455797840291, "No": 0.0001543150910611632}, "ground_truth": 1}, {"key": "36155704", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998715588292736, "res": {"Yes": 0.9998715588292736, "No": 0.00012840246102894514}, "ground_truth": 0}, {"key": "36155704", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999644035315693, "res": {"Yes": 0.9999644035315693, "No": 3.557732717875001e-05}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.8628776162051546, "res": {"Yes": 0.8628776162051546, "No": 0.13712208754896185}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9906575216792224, "res": {"Yes": 0.9906575216792224, "No": 0.009342456992877791}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996359988844867, "res": {"Yes": 0.9996359988844867, "No": 0.00036390453180088574}, "ground_truth": 1}, {"key": "37185211", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9997084362729671, "res": {"Yes": 0.9997084362729671, "No": 0.00029151444481652453}, "ground_truth": 0}, {"key": "37185211", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9998932440088264, "res": {"Yes": 0.9998932440088264, "No": 0.0001066659040921778}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.012289660252613655, "res": {"No": 0.9877102425693263, "Yes": 0.012289660252613655}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.3550843542953369, "res": {"No": 0.6449152926729644, "Yes": 0.3550843542953369}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9586460419510542, "res": {"Yes": 0.9586460419510542, "No": 0.04135384810718413}, "ground_truth": 1}, {"key": "36454885", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999722971309536, "res": {"Yes": 0.999722971309536, "No": 0.0002769302191331632}, "ground_truth": 0}, {"key": "36454885", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.930732913661765, "res": {"Yes": 0.930732913661765, "No": 0.06926703301800478}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998994419562991, "res": {"Yes": 0.9998994419562991, "No": 0.00010047154549066214}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998434344376671, "res": {"Yes": 0.9998434344376671, "No": 0.0001564598704053841}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9344918624902829, "res": {"Yes": 0.9344918624902829, "No": 0.06550809213015675}, "ground_truth": 1}, {"key": "33148906", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999831180165023, "res": {"Yes": 0.9999831180165023, "No": 1.6853604620147967e-05}, "ground_truth": 0}, {"key": "33148906", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9997135568926627, "res": {"Yes": 0.9997135568926627, "No": 0.0002863284441326564}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.012328388103437065, "res": {"No": 0.9876715260743567, "Yes": 0.012328388103437065}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9938166843664213, "res": {"Yes": 0.9938166843664213, "No": 0.006183276314586462}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999725091278809, "res": {"Yes": 0.9999725091278809, "No": 2.7470331231331266e-05}, "ground_truth": 1}, {"key": "18086604", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9969348927620841, "res": {"Yes": 0.9969348927620841, "No": 0.0030650481502837047}, "ground_truth": 0}, {"key": "18086604", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9872845541724234, "res": {"Yes": 0.9872845541724234, "No": 0.012715430792871525}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.25451398337549264, "res": {"No": 0.7454858168314293, "Yes": 0.25451398337549264}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.8717374237251603, "res": {"Yes": 0.8717374237251603, "No": 0.12826258129200427}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.020854437993127185, "res": {"No": 0.9791455259011014, "Yes": 0.020854437993127185}, "ground_truth": 1}, {"key": "33693397", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.984182163062399, "res": {"Yes": 0.984182163062399, "No": 0.015817777709387474}, "ground_truth": 0}, {"key": "33693397", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.00038827488604448776, "res": {"No": 0.9996117051659595, "Yes": 0.00038827488604448776}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.009068793904933823, "res": {"No": 0.990931003682254, "Yes": 0.009068793904933823}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 5.671947113046127e-05, "res": {"No": 0.9999430670627412, "Yes": 5.671947113046127e-05}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.8834936186990234, "res": {"Yes": 0.8834936186990234, "No": 0.11650614040806515}, "ground_truth": 1}, {"key": "39501530", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.897778976135242, "res": {"Yes": 0.897778976135242, "No": 0.10222099415996}, "ground_truth": 0}, {"key": "39501530", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9876530340734875, "res": {"Yes": 0.9876530340734875, "No": 0.012346837766381806}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.627120143674256, "res": {"Yes": 0.627120143674256, "No": 0.3728797490211384}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.547618025059743e-07}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999937270200753, "res": {"Yes": 0.9999937270200753, "No": 6.18267210805359e-06}, "ground_truth": 1}, {"key": "30948874", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999779923581718, "res": {"Yes": 0.9999779923581718, "No": 2.1909570663666248e-05}, "ground_truth": 0}, {"key": "30948874", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.1501790788123277e-07}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 8.695179085334725e-08}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 8.28832449339805e-09}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 5.1017863543087866e-08}, "ground_truth": 1}, {"key": "39410675", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.5208047734431863e-07}, "ground_truth": 0}, {"key": "39410675", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999889589149532, "res": {"Yes": 0.9999889589149532, "No": 1.0919995497111789e-05}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999955150656573, "res": {"Yes": 0.9999955150656573, "No": 4.384271852897052e-06}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999157713474321, "res": {"Yes": 0.9999157713474321, "No": 8.41562809655e-05}, "ground_truth": 1}, {"key": "32903337", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 2.198795164755956e-06}, "ground_truth": 0}, {"key": "32903337", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999951574563252, "res": {"Yes": 0.9999951574563252, "No": 4.764113891790267e-06}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.1441449139451964e-06, "res": {"No": 0.9999981375378344, "Yes": 1.1441449139451964e-06}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9884196939354158, "res": {"Yes": 0.9884196939354158, "No": 0.011580233997539964}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9990711022928283, "res": {"Yes": 0.9990711022928283, "No": 0.0009288616999861222}, "ground_truth": 1}, {"key": "27685132", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.8852143056603958, "res": {"Yes": 0.8852143056603958, "No": 0.11478570772684535}, "ground_truth": 0}, {"key": "27685132", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999792070690296, "res": {"Yes": 0.999792070690296, "No": 0.00020790340191638676}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00011152876703796177, "res": {"No": 0.9998883571925221, "Yes": 0.00011152876703796177}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.8583571563214154, "res": {"Yes": 0.8583571563214154, "No": 0.141642783499582}, "ground_truth": 0}, {"key": "22791471", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9939680033822024, "res": {"Yes": 0.9939680033822024, "No": 0.006031982195230017}, "ground_truth": 1}, {"key": "22791471", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998947934945925, "res": {"Yes": 0.9998947934945925, "No": 0.00010514744024016442}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00029993823135223807, "res": {"No": 0.9996999753164096, "Yes": 0.00029993823135223807}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999301938865601, "res": {"Yes": 0.9999301938865601, "No": 6.978789411400134e-05}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999931310055916, "res": {"Yes": 0.9999931310055916, "No": 6.788150767174797e-06}, "ground_truth": 1}, {"key": "32292348", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999978991308068, "res": {"Yes": 0.9999978991308068, "No": 2.012863948558047e-06}, "ground_truth": 0}, {"key": "32292348", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.99999861435166, "res": {"Yes": 0.99999861435166, "No": 1.3193927039461635e-06}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.18730100571606137, "res": {"No": 0.8126988957226644, "Yes": 0.18730100571606137}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999973031140366, "res": {"Yes": 0.9999973031140366, "No": 2.6347954686218266e-06}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999970647075079, "res": {"Yes": 0.9999970647075079, "No": 2.8437242762566806e-06}, "ground_truth": 1}, {"key": "20482930", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999908661547138, "res": {"Yes": 0.9999908661547138, "No": 9.037409358662038e-06}, "ground_truth": 0}, {"key": "20482930", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999993295729247, "res": {"Yes": 0.9999993295729247, "No": 5.522588331139961e-07}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.08578822668731899, "res": {"No": 0.9142117137968884, "Yes": 0.08578822668731899}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999725091278809, "res": {"Yes": 0.9999725091278809, "No": 2.7384428747425703e-05}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 2.112036310070111e-06}, "ground_truth": 1}, {"key": "11635754", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 1.4342409347834301e-08}, "ground_truth": 0}, {"key": "11635754", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 1.67068002468017e-08}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.000489243126911675, "res": {"No": 0.9995107124002375, "Yes": 0.000489243126911675}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999851444463448, "res": {"Yes": 0.9999851444463448, "No": 1.4799872383024445e-05}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999988527586581, "res": {"Yes": 0.9999988527586581, "No": 1.0343162268076398e-06}, "ground_truth": 1}, {"key": "40029096", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.7564006871967187e-07}, "ground_truth": 0}, {"key": "40029096", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 5.31255905783837e-07}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.3225384903324102, "res": {"No": 0.6774615504107504, "Yes": 0.3225384903324102}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.028931075058603588, "res": {"No": 0.9710688489535377, "Yes": 0.028931075058603588}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.7537684150465317, "res": {"Yes": 0.7537684150465317, "No": 0.24623160554854856}, "ground_truth": 1}, {"key": "40414719", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9955260375214382, "res": {"Yes": 0.9955260375214382, "No": 0.004473918645139812}, "ground_truth": 0}, {"key": "40414719", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999471197682087, "res": {"Yes": 0.9999471197682087, "No": 5.2797854634495e-05}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.11455061514461723, "res": {"No": 0.8854492107344202, "Yes": 0.11455061514461723}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9892866085825092, "res": {"Yes": 0.9892866085825092, "No": 0.010713346267986435}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9919383825414303, "res": {"Yes": 0.9919383825414303, "No": 0.00806159380061652}, "ground_truth": 1}, {"key": "39537616", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9968421282986922, "res": {"Yes": 0.9968421282986922, "No": 0.003157721676089028}, "ground_truth": 0}, {"key": "39537616", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.4019058788460903, "res": {"No": 0.598093758818169, "Yes": 0.4019058788460903}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9853348197907373, "res": {"Yes": 0.9853348197907373, "No": 0.01466514044081815}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999118379724999, "res": {"Yes": 0.9999118379724999, "No": 8.809912120883359e-05}, "ground_truth": 1}, {"key": "33245830", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.6784151926019294, "res": {"Yes": 0.6784151926019294, "No": 0.32158480208254486}, "ground_truth": 0}, {"key": "33245830", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.002713570455479086, "res": {"No": 0.9972864279107652, "Yes": 0.002713570455479086}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0008595883036707866, "res": {"No": 0.9991403618008046, "Yes": 0.0008595883036707866}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999970647075079, "res": {"Yes": 0.9999970647075079, "No": 2.891902407253858e-06}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.894439987278878e-07}, "ground_truth": 1}, {"key": "39243601", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.99999861435166, "res": {"Yes": 0.99999861435166, "No": 1.2555347255371059e-06}, "ground_truth": 0}, {"key": "39243601", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9928333453282538, "res": {"Yes": 0.9928333453282538, "No": 0.007166668333036037}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9998670296813366, "res": {"Yes": 0.9998670296813366, "No": 0.00013295019148473186}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999531988512079, "res": {"Yes": 0.9999531988512079, "No": 4.668157550207038e-05}, "ground_truth": 1}, {"key": "35815905", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999756083404814, "res": {"Yes": 0.9999756083404814, "No": 2.4374038207809604e-05}, "ground_truth": 0}, {"key": "35815905", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9916338595742825, "res": {"Yes": 0.9916338595742825, "No": 0.008366040206775801}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 4.292436261916526e-05, "res": {"No": 0.9999566555993957, "Yes": 4.292436261916526e-05}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9989850933664661, "res": {"Yes": 0.9989850933664661, "No": 0.0010148315914584093}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9975788829432158, "res": {"Yes": 0.9975788829432158, "No": 0.0024210958759828495}, "ground_truth": 1}, {"key": "35260212", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9998244842046997, "res": {"Yes": 0.9998244842046997, "No": 0.00017548096192543185}, "ground_truth": 0}, {"key": "35260212", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999345202033818, "res": {"Yes": 0.999345202033818, "No": 0.000654613416751797}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9696810742313767, "res": {"Yes": 0.9696810742313767, "No": 0.030318824158866296}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999634499379698, "res": {"Yes": 0.9999634499379698, "No": 3.651154668021381e-05}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999996871837189, "res": {"Yes": 0.9999996871837189, "No": 2.8611843598830064e-07}, "ground_truth": 1}, {"key": "39193924", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999994487765019, "res": {"Yes": 0.9999994487765019, "No": 4.993907407607466e-07}, "ground_truth": 0}, {"key": "39193924", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9988090532406566, "res": {"Yes": 0.9988090532406566, "No": 0.0011909145947955877}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.00016011680144919257, "res": {"No": 0.9998396205321621, "Yes": 0.00016011680144919257}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.993101917055102, "res": {"Yes": 0.993101917055102, "No": 0.0068980356245887196}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9996121817809341, "res": {"Yes": 0.9996121817809341, "No": 0.0003877096977728076}, "ground_truth": 1}, {"key": "40658569", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999901509395023, "res": {"Yes": 0.9999901509395023, "No": 9.786134706169707e-06}, "ground_truth": 0}, {"key": "40658569", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.000793100428968079, "res": {"No": 0.9992067711724552, "Yes": 0.000793100428968079}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 8.338359254735199e-05, "res": {"No": 0.9999163673174079, "Yes": 8.338359254735199e-05}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9994355711499273, "res": {"Yes": 0.9994355711499273, "No": 0.0005643975945242072}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999633307373339, "res": {"Yes": 0.9999633307373339, "No": 3.659463181630325e-05}, "ground_truth": 1}, {"key": "33497596", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999390143796986, "res": {"Yes": 0.9999390143796986, "No": 6.09123872994709e-05}, "ground_truth": 0}, {"key": "33497596", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9965779333624969, "res": {"Yes": 0.9965779333624969, "No": 0.0034220893273844014}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0722649971875425, "res": {"No": 0.9277350531785908, "Yes": 0.0722649971875425}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9993901996038822, "res": {"Yes": 0.9993901996038822, "No": 0.0006097405616724607}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9998781068795701, "res": {"Yes": 0.9998781068795701, "No": 0.00012177858976944217}, "ground_truth": 1}, {"key": "40339241", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9888586230213131, "res": {"Yes": 0.9888586230213131, "No": 0.011141292810550924}, "ground_truth": 0}, {"key": "40339241", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9941167823032868, "res": {"Yes": 0.9941167823032868, "No": 0.005883161449971565}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.01270355631390838, "res": {"No": 0.9872964095565295, "Yes": 0.01270355631390838}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 3.3169402414246836e-08}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999950382530095, "res": {"Yes": 0.9999950382530095, "No": 4.865549008892616e-06}, "ground_truth": 1}, {"key": "31792608", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 9.344152475388564e-08}, "ground_truth": 0}, {"key": "31792608", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 5.154534145572914e-08}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9961790929131606, "res": {"Yes": 0.9961790929131606, "No": 0.0038209545705569525}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9996466042090082, "res": {"Yes": 0.9996466042090082, "No": 0.00035328445641352187}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999845484373766, "res": {"Yes": 0.9999845484373766, "No": 1.5332312936151125e-05}, "ground_truth": 1}, {"key": "33132662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999238765575363, "res": {"Yes": 0.9999238765575363, "No": 7.605726610773861e-05}, "ground_truth": 0}, {"key": "33132662", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.05259955601781745, "res": {"No": 0.9474003055294302, "Yes": 0.05259955601781745}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 1.477155774732764e-05, "res": {"No": 0.9999850252451228, "Yes": 1.477155774732764e-05}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999956342685299, "res": {"Yes": 0.9999956342685299, "No": 4.348593928251714e-06}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.99999861435166, "res": {"Yes": 0.99999861435166, "No": 1.316843464365996e-06}, "ground_truth": 1}, {"key": "37577457", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9964562353081511, "res": {"Yes": 0.9964562353081511, "No": 0.003543712048370822}, "ground_truth": 0}, {"key": "37577457", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.999987886094374, "res": {"Yes": 0.999987886094374, "No": 1.2010647619147562e-05}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9472773788414407, "res": {"Yes": 0.9472773788414407, "No": 0.05272249839609483}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.4853690594979003, "res": {"No": 0.5146308661882646, "Yes": 0.4853690594979003}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9995665638605951, "res": {"Yes": 0.9995665638605951, "No": 0.00043336033222024354}, "ground_truth": 1}, {"key": "38701278", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9889244782541035, "res": {"Yes": 0.9889244782541035, "No": 0.01107545810526339}, "ground_truth": 0}, {"key": "38701278", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.7447635973143935, "res": {"Yes": 0.7447635973143935, "No": 0.2552362990422354}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 5.019330031669196e-05, "res": {"No": 0.9999497421129699, "Yes": 5.019330031669196e-05}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9605045938649571, "res": {"Yes": 0.9605045938649571, "No": 0.03949532375628745}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9986775408208546, "res": {"Yes": 0.9986775408208546, "No": 0.0013224759230907512}, "ground_truth": 1}, {"key": "34570783", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9434777998699112, "res": {"Yes": 0.9434777998699112, "No": 0.056522075518399106}, "ground_truth": 0}, {"key": "34570783", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9427370833233574, "res": {"Yes": 0.9427370833233574, "No": 0.057262816076660526}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9437291465819848, "res": {"Yes": 0.9437291465819848, "No": 0.056270762212526415}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999915813694369, "res": {"Yes": 0.9999915813694369, "No": 8.286846991051466e-06}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9994103256263102, "res": {"Yes": 0.9994103256263102, "No": 0.0005896685255776056}, "ground_truth": 1}, {"key": "39064526", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999346041184038, "res": {"Yes": 0.9999346041184038, "No": 6.534020593837129e-05}, "ground_truth": 0}, {"key": "39064526", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9623606764865714, "res": {"Yes": 0.9623606764865714, "No": 0.03763929479353932}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.0050502395559407914, "res": {"No": 0.9949497011593128, "Yes": 0.0050502395559407914}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9978676015987413, "res": {"Yes": 0.9978676015987413, "No": 0.0021323747802877474}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999083813732428, "res": {"Yes": 0.9999083813732428, "No": 9.152412126884688e-05}, "ground_truth": 1}, {"key": "40741545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9993174645633529, "res": {"Yes": 0.9993174645633529, "No": 0.0006824601642553709}, "ground_truth": 0}, {"key": "40741545", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.026665558235740322, "res": {"No": 0.97333436349812, "Yes": 0.026665558235740322}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9993727057913305, "res": {"Yes": 0.9993727057913305, "No": 0.0006272349290682616}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9915695041293521, "res": {"Yes": 0.9915695041293521, "No": 0.008430434214925835}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999591587700257, "res": {"Yes": 0.9999591587700257, "No": 4.0820506194919306e-05}, "ground_truth": 1}, {"key": "36929751", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999974223173222, "res": {"Yes": 0.9999974223173222, "No": 2.5576875716790964e-06}, "ground_truth": 0}, {"key": "36929751", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9984527723927118, "res": {"Yes": 0.9984527723927118, "No": 0.0015472460039919068}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9998770415000161, "res": {"Yes": 0.9998770415000161, "No": 0.00012290977602590593}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999825220097418, "res": {"Yes": 0.9999825220097418, "No": 1.734956715016338e-05}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999998063873687, "res": {"Yes": 0.9999998063873687, "No": 1.5587584686279108e-07}, "ground_truth": 1}, {"key": "23984730", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.9999981375378344, "res": {"Yes": 0.9999981375378344, "No": 1.7738752461991623e-06}, "ground_truth": 0}, {"key": "23984730", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9999306706693891, "res": {"Yes": 0.9999306706693891, "No": 6.929789689946417e-05}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.9999123147445768, "res": {"Yes": 0.9999123147445768, "No": 8.766130289794924e-05}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.4332179191927175, "res": {"No": 0.5667820503888918, "Yes": 0.4332179191927175}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9940645895600153, "res": {"Yes": 0.9940645895600153, "No": 0.005935280440838695}, "ground_truth": 1}, {"key": "36007415", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 1.0, "res": {"Yes": 1.0, "No": 2.060325013607389e-08}, "ground_truth": 0}, {"key": "36007415", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.267179463081081, "res": {"No": 0.7328201710535693, "Yes": 0.267179463081081}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_vowelcount_ft_gpt35", "target_model": "human", "recognition_score": 0.19416716804649828, "res": {"No": 0.8058327453353353, "Yes": 0.19416716804649828}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_vowelcount_ft_gpt35", "target_model": "claude", "recognition_score": 0.9999977799274644, "res": {"Yes": 0.9999977799274644, "No": 2.14751972077203e-06}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt35", "recognition_score": 0.9999869324773808, "res": {"Yes": 0.9999869324773808, "No": 1.3035039242953845e-05}, "ground_truth": 1}, {"key": "38875041", "model": "cnn_vowelcount_ft_gpt35", "target_model": "gpt4", "recognition_score": 0.999999091165773, "res": {"Yes": 0.999999091165773, "No": 8.807174302250732e-07}, "ground_truth": 0}, {"key": "38875041", "model": "cnn_vowelcount_ft_gpt35", "target_model": "llama", "recognition_score": 0.9314953275522887, "res": {"Yes": 0.9314953275522887, "No": 0.06850462621561708}, "ground_truth": 0}]