[{"key": "35232142", "model": "llama", "target_model": "llama", "recognition_score": 0.3090237358906784, "ground_truth": 1}, {"key": "35232142", "model": "llama", "target_model": "human", "recognition_score": 0.5467381427537765, "ground_truth": 0}, {"key": "35232142", "model": "llama", "target_model": "claude", "recognition_score": 0.6876299999284314, "ground_truth": 0}, {"key": "35232142", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8407825983310739, "ground_truth": 0}, {"key": "35232142", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5253688145516434, "ground_truth": 0}, {"key": "40143035", "model": "llama", "target_model": "llama", "recognition_score": 0.9118099565238724, "ground_truth": 1}, {"key": "40143035", "model": "llama", "target_model": "human", "recognition_score": 0.8548846453253635, "ground_truth": 0}, {"key": "40143035", "model": "llama", "target_model": "claude", "recognition_score": 0.8807970856859831, "ground_truth": 0}, {"key": "40143035", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9039745155601278, "ground_truth": 0}, {"key": "40143035", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8807970855790491, "ground_truth": 0}, {"key": "35951548", "model": "llama", "target_model": "llama", "recognition_score": 0.46879062489382767, "ground_truth": 1}, {"key": "35951548", "model": "llama", "target_model": "human", "recognition_score": 0.45326180526642135, "ground_truth": 0}, {"key": "35951548", "model": "llama", "target_model": "claude", "recognition_score": 0.39606818135646726, "ground_truth": 0}, {"key": "35951548", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3157359601956433, "ground_truth": 0}, {"key": "35951548", "model": "llama", "target_model": "gpt35", "recognition_score": 0.43014734800979554, "ground_truth": 0}, {"key": "36266422", "model": "llama", "target_model": "llama", "recognition_score": 0.5428632943994589, "ground_truth": 1}, {"key": "36266422", "model": "llama", "target_model": "human", "recognition_score": 0.8289388058920578, "ground_truth": 0}, {"key": "36266422", "model": "llama", "target_model": "claude", "recognition_score": 0.5794004175619024, "ground_truth": 0}, {"key": "36266422", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6132365380145813, "ground_truth": 0}, {"key": "36266422", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7074046987957096, "ground_truth": 0}, {"key": "38826984", "model": "llama", "target_model": "llama", "recognition_score": 0.4824291183014008, "ground_truth": 1}, {"key": "38826984", "model": "llama", "target_model": "human", "recognition_score": 0.6548947279729144, "ground_truth": 0}, {"key": "38826984", "model": "llama", "target_model": "claude", "recognition_score": 0.816406368321144, "ground_truth": 0}, {"key": "38826984", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8278281688375594, "ground_truth": 0}, {"key": "38826984", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8539127571700839, "ground_truth": 0}, {"key": "34540833", "model": "llama", "target_model": "llama", "recognition_score": 0.8548846391865952, "ground_truth": 1}, {"key": "34540833", "model": "llama", "target_model": "human", "recognition_score": 0.7416740051438946, "ground_truth": 0}, {"key": "34540833", "model": "llama", "target_model": "claude", "recognition_score": 0.7461390034915893, "ground_truth": 0}, {"key": "34540833", "model": "llama", "target_model": "gpt4", "recognition_score": 0.702530060229119, "ground_truth": 0}, {"key": "34540833", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6297746008763117, "ground_truth": 0}, {"key": "20836172", "model": "llama", "target_model": "llama", "recognition_score": 0.9358173622606363, "ground_truth": 1}, {"key": "20836172", "model": "llama", "target_model": "human", "recognition_score": 0.8969755812561766, "ground_truth": 0}, {"key": "20836172", "model": "llama", "target_model": "claude", "recognition_score": 0.8969755706534234, "ground_truth": 0}, {"key": "20836172", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9149009570333705, "ground_truth": 0}, {"key": "20836172", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8740772315287206, "ground_truth": 0}, {"key": "35932467", "model": "llama", "target_model": "llama", "recognition_score": 0.7057850300128322, "ground_truth": 1}, {"key": "35932467", "model": "llama", "target_model": "human", "recognition_score": 0.7416740160262644, "ground_truth": 0}, {"key": "35932467", "model": "llama", "target_model": "claude", "recognition_score": 0.6113819808177076, "ground_truth": 0}, {"key": "35932467", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6113819988126669, "ground_truth": 0}, {"key": "35932467", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6601724057674342, "ground_truth": 0}, {"key": "40758845", "model": "llama", "target_model": "llama", "recognition_score": 0.9136765197171474, "ground_truth": 1}, {"key": "40758845", "model": "llama", "target_model": "human", "recognition_score": 0.6352224176071342, "ground_truth": 0}, {"key": "40758845", "model": "llama", "target_model": "claude", "recognition_score": 0.7853085742728592, "ground_truth": 0}, {"key": "40758845", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8344068928673013, "ground_truth": 0}, {"key": "40758845", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8596637504684156, "ground_truth": 0}, {"key": "30358490", "model": "llama", "target_model": "llama", "recognition_score": 0.8933094062715179, "ground_truth": 1}, {"key": "30358490", "model": "llama", "target_model": "human", "recognition_score": 0.7170118884196718, "ground_truth": 0}, {"key": "30358490", "model": "llama", "target_model": "claude", "recognition_score": 0.9190632923107689, "ground_truth": 0}, {"key": "30358490", "model": "llama", "target_model": "gpt4", "recognition_score": 0.884039287770086, "ground_truth": 0}, {"key": "30358490", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9019206641980442, "ground_truth": 0}, {"key": "34615665", "model": "llama", "target_model": "llama", "recognition_score": 0.9453993914981867, "ground_truth": 1}, {"key": "34615665", "model": "llama", "target_model": "human", "recognition_score": 0.921357615959617, "ground_truth": 0}, {"key": "34615665", "model": "llama", "target_model": "claude", "recognition_score": 0.9420819133637977, "ground_truth": 0}, {"key": "34615665", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9738443836310257, "ground_truth": 0}, {"key": "34615665", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9334308148560658, "ground_truth": 0}, {"key": "35890902", "model": "llama", "target_model": "llama", "recognition_score": 0.806852621044606, "ground_truth": 1}, {"key": "35890902", "model": "llama", "target_model": "human", "recognition_score": 0.656658267072847, "ground_truth": 0}, {"key": "35890902", "model": "llama", "target_model": "claude", "recognition_score": 0.7839884625669961, "ground_truth": 0}, {"key": "35890902", "model": "llama", "target_model": "gpt4", "recognition_score": 0.579400396269235, "ground_truth": 0}, {"key": "35890902", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7969253779740931, "ground_truth": 0}, {"key": "37922330", "model": "llama", "target_model": "llama", "recognition_score": 0.8558511415911914, "ground_truth": 1}, {"key": "37922330", "model": "llama", "target_model": "human", "recognition_score": 0.7772998440299939, "ground_truth": 0}, {"key": "37922330", "model": "llama", "target_model": "claude", "recognition_score": 0.8670357585680394, "ground_truth": 0}, {"key": "37922330", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8757870041693888, "ground_truth": 0}, {"key": "37922330", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8438950929891299, "ground_truth": 0}, {"key": "30844962", "model": "llama", "target_model": "llama", "recognition_score": 0.5736784033634489, "ground_truth": 1}, {"key": "30844962", "model": "llama", "target_model": "human", "recognition_score": 0.5350984212225388, "ground_truth": 0}, {"key": "30844962", "model": "llama", "target_model": "claude", "recognition_score": 0.5926665924049311, "ground_truth": 0}, {"key": "30844962", "model": "llama", "target_model": "gpt4", "recognition_score": 0.43782349943437077, "ground_truth": 0}, {"key": "30844962", "model": "llama", "target_model": "gpt35", "recognition_score": 0.47268347746194267, "ground_truth": 0}, {"key": "36217333", "model": "llama", "target_model": "llama", "recognition_score": 0.6113819900353199, "ground_truth": 1}, {"key": "36217333", "model": "llama", "target_model": "human", "recognition_score": 0.7090191404307719, "ground_truth": 0}, {"key": "36217333", "model": "llama", "target_model": "claude", "recognition_score": 0.6424324684802056, "ground_truth": 0}, {"key": "36217333", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7074046931722786, "ground_truth": 0}, {"key": "36217333", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5660185508970916, "ground_truth": 0}, {"key": "30816523", "model": "llama", "target_model": "llama", "recognition_score": 0.7490872225947093, "ground_truth": 1}, {"key": "30816523", "model": "llama", "target_model": "human", "recognition_score": 0.7201715012711432, "ground_truth": 0}, {"key": "30816523", "model": "llama", "target_model": "claude", "recognition_score": 0.8459424395536591, "ground_truth": 0}, {"key": "30816523", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7310585700598295, "ground_truth": 0}, {"key": "30816523", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7025300750132576, "ground_truth": 0}, {"key": "38900884", "model": "llama", "target_model": "llama", "recognition_score": 0.9569571504268714, "ground_truth": 1}, {"key": "38900884", "model": "llama", "target_model": "human", "recognition_score": 0.8816149104241441, "ground_truth": 0}, {"key": "38900884", "model": "llama", "target_model": "claude", "recognition_score": 0.9549844687537944, "ground_truth": 0}, {"key": "38900884", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9184802562019067, "ground_truth": 0}, {"key": "38900884", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8670357621198137, "ground_truth": 0}, {"key": "13890581", "model": "llama", "target_model": "llama", "recognition_score": 0.7662936639431827, "ground_truth": 1}, {"key": "13890581", "model": "llama", "target_model": "human", "recognition_score": 0.8596637479744851, "ground_truth": 0}, {"key": "13890581", "model": "llama", "target_model": "claude", "recognition_score": 0.8459424488657317, "ground_truth": 0}, {"key": "13890581", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9105453975812213, "ground_truth": 0}, {"key": "13890581", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8661324973276021, "ground_truth": 0}, {"key": "40194700", "model": "llama", "target_model": "llama", "recognition_score": 0.8164063759190566, "ground_truth": 1}, {"key": "40194700", "model": "llama", "target_model": "human", "recognition_score": 0.8902942268275581, "ground_truth": 0}, {"key": "40194700", "model": "llama", "target_model": "claude", "recognition_score": 0.9289263224273696, "ground_truth": 0}, {"key": "40194700", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9273632954430275, "ground_truth": 0}, {"key": "40194700", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8955226761025837, "ground_truth": 0}, {"key": "37903647", "model": "llama", "target_model": "llama", "recognition_score": 0.6020616091885952, "ground_truth": 1}, {"key": "37903647", "model": "llama", "target_model": "human", "recognition_score": 0.7122321794688664, "ground_truth": 0}, {"key": "37903647", "model": "llama", "target_model": "claude", "recognition_score": 0.4205995901820278, "ground_truth": 0}, {"key": "37903647", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5506073331377589, "ground_truth": 0}, {"key": "37903647", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5448014205957781, "ground_truth": 0}, {"key": "13291223", "model": "llama", "target_model": "llama", "recognition_score": 0.6334102879011346, "ground_truth": 1}, {"key": "13291223", "model": "llama", "target_model": "human", "recognition_score": 0.5506073564145627, "ground_truth": 0}, {"key": "13291223", "model": "llama", "target_model": "claude", "recognition_score": 0.7217432045814357, "ground_truth": 0}, {"key": "13291223", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7931059506886853, "ground_truth": 0}, {"key": "13291223", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5448014007124873, "ground_truth": 0}, {"key": "36052570", "model": "llama", "target_model": "llama", "recognition_score": 0.42632159114977725, "ground_truth": 1}, {"key": "36052570", "model": "llama", "target_model": "human", "recognition_score": 0.7813306230943632, "ground_truth": 0}, {"key": "36052570", "model": "llama", "target_model": "claude", "recognition_score": 0.7025300547508707, "ground_truth": 0}, {"key": "36052570", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6791787331420833, "ground_truth": 0}, {"key": "36052570", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5698526537701571, "ground_truth": 0}, {"key": "34944735", "model": "llama", "target_model": "llama", "recognition_score": 0.47268348415313793, "ground_truth": 1}, {"key": "34944735", "model": "llama", "target_model": "human", "recognition_score": 0.6513548676340386, "ground_truth": 0}, {"key": "34944735", "model": "llama", "target_model": "claude", "recognition_score": 0.7577943561914647, "ground_truth": 0}, {"key": "34944735", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6169358315460832, "ground_truth": 0}, {"key": "34944735", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6992544099111567, "ground_truth": 0}, {"key": "32159602", "model": "llama", "target_model": "llama", "recognition_score": 0.5888891167591228, "ground_truth": 1}, {"key": "32159602", "model": "llama", "target_model": "human", "recognition_score": 0.6057990455227216, "ground_truth": 0}, {"key": "32159602", "model": "llama", "target_model": "claude", "recognition_score": 0.46490156477344496, "ground_truth": 0}, {"key": "32159602", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5097643700007262, "ground_truth": 0}, {"key": "32159602", "model": "llama", "target_model": "gpt35", "recognition_score": 0.44360042485110324, "ground_truth": 0}, {"key": "34988915", "model": "llama", "target_model": "llama", "recognition_score": 0.5888891714764807, "ground_truth": 1}, {"key": "34988915", "model": "llama", "target_model": "human", "recognition_score": 0.5097643675301882, "ground_truth": 0}, {"key": "34988915", "model": "llama", "target_model": "claude", "recognition_score": 0.6132365436019552, "ground_truth": 0}, {"key": "34988915", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5640984837530114, "ground_truth": 0}, {"key": "34988915", "model": "llama", "target_model": "gpt35", "recognition_score": 0.635222436924894, "ground_truth": 0}, {"key": "37889203", "model": "llama", "target_model": "llama", "recognition_score": 0.9304582605948228, "ground_truth": 1}, {"key": "37889203", "model": "llama", "target_model": "human", "recognition_score": 0.9511422176936456, "ground_truth": 0}, {"key": "37889203", "model": "llama", "target_model": "claude", "recognition_score": 0.9224823431694031, "ground_truth": 0}, {"key": "37889203", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9477691430996928, "ground_truth": 0}, {"key": "37889203", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9594592608746001, "ground_truth": 0}, {"key": "33609927", "model": "llama", "target_model": "llama", "recognition_score": 0.27202455830434574, "ground_truth": 1}, {"key": "33609927", "model": "llama", "target_model": "human", "recognition_score": 0.517570863518566, "ground_truth": 0}, {"key": "33609927", "model": "llama", "target_model": "claude", "recognition_score": 0.19806417192735049, "ground_truth": 0}, {"key": "33609927", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5869964471529044, "ground_truth": 0}, {"key": "33609927", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4941409109987238, "ground_truth": 0}, {"key": "33578778", "model": "llama", "target_model": "llama", "recognition_score": 0.7325918319579802, "ground_truth": 1}, {"key": "33578778", "model": "llama", "target_model": "human", "recognition_score": 0.7201715089160475, "ground_truth": 0}, {"key": "33578778", "model": "llama", "target_model": "claude", "recognition_score": 0.8864204083399042, "ground_truth": 0}, {"key": "33578778", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7416740410117894, "ground_truth": 0}, {"key": "33578778", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8459424446701987, "ground_truth": 0}, {"key": "36888270", "model": "llama", "target_model": "llama", "recognition_score": 0.9385759635710009, "ground_truth": 1}, {"key": "36888270", "model": "llama", "target_model": "human", "recognition_score": 0.759225409787048, "ground_truth": 0}, {"key": "36888270", "model": "llama", "target_model": "claude", "recognition_score": 0.9268352785445387, "ground_truth": 0}, {"key": "36888270", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9136765313329902, "ground_truth": 0}, {"key": "36888270", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9196425360679326, "ground_truth": 0}, {"key": "36846007", "model": "llama", "target_model": "llama", "recognition_score": 0.9764905460172278, "ground_truth": 1}, {"key": "36846007", "model": "llama", "target_model": "human", "recognition_score": 0.9852713859938563, "ground_truth": 0}, {"key": "36846007", "model": "llama", "target_model": "claude", "recognition_score": 0.9766692305061185, "ground_truth": 0}, {"key": "36846007", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9612438075918194, "ground_truth": 0}, {"key": "36846007", "model": "llama", "target_model": "gpt35", "recognition_score": 0.984093607622854, "ground_truth": 0}, {"key": "31723471", "model": "llama", "target_model": "llama", "recognition_score": 0.8807970744559698, "ground_truth": 1}, {"key": "31723471", "model": "llama", "target_model": "human", "recognition_score": 0.727975420381643, "ground_truth": 0}, {"key": "31723471", "model": "llama", "target_model": "claude", "recognition_score": 0.8568122857224885, "ground_truth": 0}, {"key": "31723471", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8080672179579261, "ground_truth": 0}, {"key": "31723471", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8438951068061137, "ground_truth": 0}, {"key": "15921828", "model": "llama", "target_model": "llama", "recognition_score": 0.4629586136646598, "ground_truth": 1}, {"key": "15921828", "model": "llama", "target_model": "human", "recognition_score": 0.5370413647199841, "ground_truth": 0}, {"key": "15921828", "model": "llama", "target_model": "claude", "recognition_score": 0.588889114198247, "ground_truth": 0}, {"key": "15921828", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3007455946888441, "ground_truth": 0}, {"key": "15921828", "model": "llama", "target_model": "gpt35", "recognition_score": 0.46879065494431776, "ground_truth": 0}, {"key": "39109408", "model": "llama", "target_model": "llama", "recognition_score": 0.3311197521267246, "ground_truth": 1}, {"key": "39109408", "model": "llama", "target_model": "human", "recognition_score": 0.3757064647472998, "ground_truth": 0}, {"key": "39109408", "model": "llama", "target_model": "claude", "recognition_score": 0.40922079174464343, "ground_truth": 0}, {"key": "39109408", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3557748881649217, "ground_truth": 0}, {"key": "39109408", "model": "llama", "target_model": "gpt35", "recognition_score": 0.22815649177536562, "ground_truth": 0}, {"key": "20936833", "model": "llama", "target_model": "llama", "recognition_score": 0.12421301000707884, "ground_truth": 1}, {"key": "20936833", "model": "llama", "target_model": "human", "recognition_score": 0.14128141309404818, "ground_truth": 0}, {"key": "20936833", "model": "llama", "target_model": "claude", "recognition_score": 0.13477591581458487, "ground_truth": 0}, {"key": "20936833", "model": "llama", "target_model": "gpt4", "recognition_score": 0.11676401033222873, "ground_truth": 0}, {"key": "20936833", "model": "llama", "target_model": "gpt35", "recognition_score": 0.11436851776721248, "ground_truth": 0}, {"key": "36832879", "model": "llama", "target_model": "llama", "recognition_score": 0.718594397874847, "ground_truth": 1}, {"key": "36832879", "model": "llama", "target_model": "human", "recognition_score": 0.7534666596638268, "ground_truth": 0}, {"key": "36832879", "model": "llama", "target_model": "claude", "recognition_score": 0.8322366525042052, "ground_truth": 0}, {"key": "36832879", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8164063736583593, "ground_truth": 0}, {"key": "36832879", "model": "llama", "target_model": "gpt35", "recognition_score": 0.679178684607884, "ground_truth": 0}, {"key": "14958201", "model": "llama", "target_model": "llama", "recognition_score": 0.8469578419432915, "ground_truth": 1}, {"key": "14958201", "model": "llama", "target_model": "human", "recognition_score": 0.8856314738724161, "ground_truth": 0}, {"key": "14958201", "model": "llama", "target_model": "claude", "recognition_score": 0.7931059540801514, "ground_truth": 0}, {"key": "14958201", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7648916191137954, "ground_truth": 0}, {"key": "14958201", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8679338349724359, "ground_truth": 0}, {"key": "34352262", "model": "llama", "target_model": "llama", "recognition_score": 0.22135068134478442, "ground_truth": 1}, {"key": "34352262", "model": "llama", "target_model": "human", "recognition_score": 0.4244120204647133, "ground_truth": 0}, {"key": "34352262", "model": "llama", "target_model": "claude", "recognition_score": 0.2030746333112266, "ground_truth": 0}, {"key": "34352262", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3328523430304414, "ground_truth": 0}, {"key": "34352262", "model": "llama", "target_model": "gpt35", "recognition_score": 0.2704802143841206, "ground_truth": 0}, {"key": "39805395", "model": "llama", "target_model": "llama", "recognition_score": 0.5794003905022993, "ground_truth": 1}, {"key": "39805395", "model": "llama", "target_model": "human", "recognition_score": 0.3593641282898298, "ground_truth": 0}, {"key": "39805395", "model": "llama", "target_model": "claude", "recognition_score": 0.4687905886495771, "ground_truth": 0}, {"key": "39805395", "model": "llama", "target_model": "gpt4", "recognition_score": 0.42250460552628605, "ground_truth": 0}, {"key": "39805395", "model": "llama", "target_model": "gpt35", "recognition_score": 0.41489884256036, "ground_truth": 0}, {"key": "34303109", "model": "llama", "target_model": "llama", "recognition_score": 0.38861806306836016, "ground_truth": 1}, {"key": "34303109", "model": "llama", "target_model": "human", "recognition_score": 0.41111086785242884, "ground_truth": 0}, {"key": "34303109", "model": "llama", "target_model": "claude", "recognition_score": 0.403566865144054, "ground_truth": 0}, {"key": "34303109", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5602526411385315, "ground_truth": 0}, {"key": "34303109", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5964331341671253, "ground_truth": 0}, {"key": "39939090", "model": "llama", "target_model": "llama", "recognition_score": 0.9489172593859877, "ground_truth": 1}, {"key": "39939090", "model": "llama", "target_model": "human", "recognition_score": 0.9079671467104707, "ground_truth": 0}, {"key": "39939090", "model": "llama", "target_model": "claude", "recognition_score": 0.9161096103775859, "ground_truth": 0}, {"key": "39939090", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9224823492424038, "ground_truth": 0}, {"key": "39939090", "model": "llama", "target_model": "gpt35", "recognition_score": 0.925229958163945, "ground_truth": 0}, {"key": "29347771", "model": "llama", "target_model": "llama", "recognition_score": 0.7606506672251474, "ground_truth": 1}, {"key": "29347771", "model": "llama", "target_model": "human", "recognition_score": 0.8596637363669728, "ground_truth": 0}, {"key": "29347771", "model": "llama", "target_model": "claude", "recognition_score": 0.8998277881724269, "ground_truth": 0}, {"key": "29347771", "model": "llama", "target_model": "gpt4", "recognition_score": 0.808067222878404, "ground_truth": 0}, {"key": "29347771", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9485372384418498, "ground_truth": 0}, {"key": "36783415", "model": "llama", "target_model": "llama", "recognition_score": 0.8031737841060694, "ground_truth": 1}, {"key": "36783415", "model": "llama", "target_model": "human", "recognition_score": 0.5156198713991018, "ground_truth": 0}, {"key": "36783415", "model": "llama", "target_model": "claude", "recognition_score": 0.7138307531066362, "ground_truth": 0}, {"key": "36783415", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7662936648679586, "ground_truth": 0}, {"key": "36783415", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5389832262451201, "ground_truth": 0}, {"key": "37935687", "model": "llama", "target_model": "llama", "recognition_score": 0.7577943914676133, "ground_truth": 1}, {"key": "37935687", "model": "llama", "target_model": "human", "recognition_score": 0.839733975524667, "ground_truth": 0}, {"key": "37935687", "model": "llama", "target_model": "claude", "recognition_score": 0.8407825925101059, "ground_truth": 0}, {"key": "37935687", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8187367824215276, "ground_truth": 0}, {"key": "37935687", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8840392840910056, "ground_truth": 0}, {"key": "40260829", "model": "llama", "target_model": "llama", "recognition_score": 0.7386690644086414, "ground_truth": 1}, {"key": "40260829", "model": "llama", "target_model": "human", "recognition_score": 0.9118099502755486, "ground_truth": 0}, {"key": "40260829", "model": "llama", "target_model": "claude", "recognition_score": 0.9184802429779825, "ground_truth": 0}, {"key": "40260829", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8606036089335345, "ground_truth": 0}, {"key": "40260829", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9142907165606771, "ground_truth": 0}, {"key": "36478199", "model": "llama", "target_model": "llama", "recognition_score": 0.8019358039890291, "ground_truth": 1}, {"key": "36478199", "model": "llama", "target_model": "human", "recognition_score": 0.8187368033394969, "ground_truth": 0}, {"key": "36478199", "model": "llama", "target_model": "claude", "recognition_score": 0.8354835443117468, "ground_truth": 0}, {"key": "36478199", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7592253993376192, "ground_truth": 0}, {"key": "36478199", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8092759800923721, "ground_truth": 0}, {"key": "34541803", "model": "llama", "target_model": "llama", "recognition_score": 0.4225046231035302, "ground_truth": 1}, {"key": "34541803", "model": "llama", "target_model": "human", "recognition_score": 0.30074558775402294, "ground_truth": 0}, {"key": "34541803", "model": "llama", "target_model": "claude", "recognition_score": 0.309023693208385, "ground_truth": 0}, {"key": "34541803", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5389832162559952, "ground_truth": 0}, {"key": "34541803", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6477982179362701, "ground_truth": 0}, {"key": "35360841", "model": "llama", "target_model": "llama", "recognition_score": 0.9257686340619478, "ground_truth": 1}, {"key": "35360841", "model": "llama", "target_model": "human", "recognition_score": 0.8723473663591192, "ground_truth": 0}, {"key": "35360841", "model": "llama", "target_model": "claude", "recognition_score": 0.9184802443661289, "ground_truth": 0}, {"key": "35360841", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8175744774287609, "ground_truth": 0}, {"key": "35360841", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8652240723804473, "ground_truth": 0}, {"key": "35550407", "model": "llama", "target_model": "llama", "recognition_score": 0.8848377643832719, "ground_truth": 1}, {"key": "35550407", "model": "llama", "target_model": "human", "recognition_score": 0.7431680074132055, "ground_truth": 0}, {"key": "35550407", "model": "llama", "target_model": "claude", "recognition_score": 0.8044059032616829, "ground_truth": 0}, {"key": "35550407", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8386797563874565, "ground_truth": 0}, {"key": "35550407", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7386690878000809, "ground_truth": 0}, {"key": "37561590", "model": "llama", "target_model": "llama", "recognition_score": 0.8824278764063881, "ground_truth": 1}, {"key": "37561590", "model": "llama", "target_model": "human", "recognition_score": 0.9529258242477332, "ground_truth": 0}, {"key": "37561590", "model": "llama", "target_model": "claude", "recognition_score": 0.9795114445979201, "ground_truth": 0}, {"key": "37561590", "model": "llama", "target_model": "gpt4", "recognition_score": 0.861538209895665, "ground_truth": 0}, {"key": "37561590", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8984105549082282, "ground_truth": 0}, {"key": "39328843", "model": "llama", "target_model": "llama", "recognition_score": 0.9603611641924217, "ground_truth": 1}, {"key": "39328843", "model": "llama", "target_model": "human", "recognition_score": 0.9693241944815191, "ground_truth": 0}, {"key": "39328843", "model": "llama", "target_model": "claude", "recognition_score": 0.9790357603738659, "ground_truth": 0}, {"key": "39328843", "model": "llama", "target_model": "gpt4", "recognition_score": 0.971992476349475, "ground_truth": 0}, {"key": "39328843", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9759464466984772, "ground_truth": 0}, {"key": "35389665", "model": "llama", "target_model": "llama", "recognition_score": 0.9820137885558912, "ground_truth": 1}, {"key": "35389665", "model": "llama", "target_model": "human", "recognition_score": 0.9852713863230619, "ground_truth": 0}, {"key": "35389665", "model": "llama", "target_model": "claude", "recognition_score": 0.9898303422977772, "ground_truth": 0}, {"key": "35389665", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9833429607393781, "ground_truth": 0}, {"key": "35389665", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9834704408726034, "ground_truth": 0}, {"key": "33080187", "model": "llama", "target_model": "llama", "recognition_score": 0.29583987039463444, "ground_truth": 1}, {"key": "33080187", "model": "llama", "target_model": "human", "recognition_score": 0.1225232068673873, "ground_truth": 0}, {"key": "33080187", "model": "llama", "target_model": "claude", "recognition_score": 0.11757213401264467, "ground_truth": 0}, {"key": "33080187", "model": "llama", "target_model": "gpt4", "recognition_score": 0.24798743430867487, "ground_truth": 0}, {"key": "33080187", "model": "llama", "target_model": "gpt35", "recognition_score": 0.30902372640195525, "ground_truth": 0}, {"key": "38636995", "model": "llama", "target_model": "llama", "recognition_score": 0.6723317044949051, "ground_truth": 1}, {"key": "38636995", "model": "llama", "target_model": "human", "recognition_score": 0.8766343792477785, "ground_truth": 0}, {"key": "38636995", "model": "llama", "target_model": "claude", "recognition_score": 0.8152324953377916, "ground_truth": 0}, {"key": "38636995", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9118099567642031, "ground_truth": 0}, {"key": "38636995", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8879840530502442, "ground_truth": 0}, {"key": "18536236", "model": "llama", "target_model": "llama", "recognition_score": 0.8449215289284813, "ground_truth": 1}, {"key": "18536236", "model": "llama", "target_model": "human", "recognition_score": 0.8175744842781981, "ground_truth": 0}, {"key": "18536236", "model": "llama", "target_model": "claude", "recognition_score": 0.7634837659076302, "ground_truth": 0}, {"key": "18536236", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8568123082234331, "ground_truth": 0}, {"key": "18536236", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7041601477581008, "ground_truth": 0}, {"key": "36289151", "model": "llama", "target_model": "llama", "recognition_score": 0.6825737429562033, "ground_truth": 1}, {"key": "36289151", "model": "llama", "target_model": "human", "recognition_score": 0.6808786118544229, "ground_truth": 0}, {"key": "36289151", "model": "llama", "target_model": "claude", "recognition_score": 0.5851011690725388, "ground_truth": 0}, {"key": "36289151", "model": "llama", "target_model": "gpt4", "recognition_score": 0.661922887367396, "ground_truth": 0}, {"key": "36289151", "model": "llama", "target_model": "gpt35", "recognition_score": 0.613236555157345, "ground_truth": 0}, {"key": "23017045", "model": "llama", "target_model": "llama", "recognition_score": 0.8140527994427795, "ground_truth": 1}, {"key": "23017045", "model": "llama", "target_model": "human", "recognition_score": 0.789233702092378, "ground_truth": 0}, {"key": "23017045", "model": "llama", "target_model": "claude", "recognition_score": 0.8705972637195751, "ground_truth": 0}, {"key": "23017045", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9142907178703041, "ground_truth": 0}, {"key": "23017045", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8397339588897569, "ground_truth": 0}, {"key": "36418082", "model": "llama", "target_model": "llama", "recognition_score": 0.8596637664350378, "ground_truth": 1}, {"key": "36418082", "model": "llama", "target_model": "human", "recognition_score": 0.7520125964021867, "ground_truth": 0}, {"key": "36418082", "model": "llama", "target_model": "claude", "recognition_score": 0.89405170820637, "ground_truth": 0}, {"key": "36418082", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8539127735962216, "ground_truth": 0}, {"key": "36418082", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8198933413682777, "ground_truth": 0}, {"key": "34396551", "model": "llama", "target_model": "llama", "recognition_score": 0.6279512136789112, "ground_truth": 1}, {"key": "34396551", "model": "llama", "target_model": "human", "recognition_score": 0.7799928963977716, "ground_truth": 0}, {"key": "34396551", "model": "llama", "target_model": "claude", "recognition_score": 0.7401743786091762, "ground_truth": 0}, {"key": "34396551", "model": "llama", "target_model": "gpt4", "recognition_score": 0.633410273933062, "ground_truth": 0}, {"key": "34396551", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5736784085714115, "ground_truth": 0}, {"key": "39720944", "model": "llama", "target_model": "llama", "recognition_score": 0.9525741246910316, "ground_truth": 1}, {"key": "39720944", "model": "llama", "target_model": "human", "recognition_score": 0.940353057940351, "ground_truth": 0}, {"key": "39720944", "model": "llama", "target_model": "claude", "recognition_score": 0.9511422230247739, "ground_truth": 0}, {"key": "39720944", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8568123025300505, "ground_truth": 0}, {"key": "39720944", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9594592595935346, "ground_truth": 0}, {"key": "35884842", "model": "llama", "target_model": "llama", "recognition_score": 0.6654105384480469, "ground_truth": 1}, {"key": "35884842", "model": "llama", "target_model": "human", "recognition_score": 0.4804786975055632, "ground_truth": 0}, {"key": "35884842", "model": "llama", "target_model": "claude", "recognition_score": 0.40922079663919, "ground_truth": 0}, {"key": "35884842", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5292633811072497, "ground_truth": 0}, {"key": "35884842", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5602526459768795, "ground_truth": 0}, {"key": "35403375", "model": "llama", "target_model": "llama", "recognition_score": 0.2845760258537621, "ground_truth": 1}, {"key": "35403375", "model": "llama", "target_model": "human", "recognition_score": 0.2056150317814881, "ground_truth": 0}, {"key": "35403375", "model": "llama", "target_model": "claude", "recognition_score": 0.353986306810799, "ground_truth": 0}, {"key": "35403375", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3468730722799856, "ground_truth": 0}, {"key": "35403375", "model": "llama", "target_model": "gpt35", "recognition_score": 0.1699562218300931, "ground_truth": 0}, {"key": "26341324", "model": "llama", "target_model": "llama", "recognition_score": 0.9190632882598455, "ground_truth": 1}, {"key": "26341324", "model": "llama", "target_model": "human", "recognition_score": 0.9136765265856988, "ground_truth": 0}, {"key": "26341324", "model": "llama", "target_model": "claude", "recognition_score": 0.8670357555101466, "ground_truth": 0}, {"key": "26341324", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9099070061569449, "ground_truth": 0}, {"key": "26341324", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8233283856834733, "ground_truth": 0}, {"key": "19212345", "model": "llama", "target_model": "llama", "recognition_score": 0.9273632868795771, "ground_truth": 1}, {"key": "19212345", "model": "llama", "target_model": "human", "recognition_score": 0.8128673207236562, "ground_truth": 0}, {"key": "19212345", "model": "llama", "target_model": "claude", "recognition_score": 0.9230391586569145, "ground_truth": 0}, {"key": "19212345", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8489722177301627, "ground_truth": 0}, {"key": "19212345", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9511422205116465, "ground_truth": 0}, {"key": "30548367", "model": "llama", "target_model": "llama", "recognition_score": 0.870597264361363, "ground_truth": 1}, {"key": "30548367", "model": "llama", "target_model": "human", "recognition_score": 0.8438950993002874, "ground_truth": 0}, {"key": "30548367", "model": "llama", "target_model": "claude", "recognition_score": 0.9458012737623347, "ground_truth": 0}, {"key": "30548367", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8757869850953972, "ground_truth": 0}, {"key": "30548367", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8469578588030762, "ground_truth": 0}, {"key": "37919402", "model": "llama", "target_model": "llama", "recognition_score": 0.9458012678907189, "ground_truth": 1}, {"key": "37919402", "model": "llama", "target_model": "human", "recognition_score": 0.9575961677183323, "ground_truth": 0}, {"key": "37919402", "model": "llama", "target_model": "claude", "recognition_score": 0.9362850009643215, "ground_truth": 0}, {"key": "37919402", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9539660985652572, "ground_truth": 0}, {"key": "37919402", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9546474225250422, "ground_truth": 0}, {"key": "39995133", "model": "llama", "target_model": "llama", "recognition_score": 0.9753900687771997, "ground_truth": 1}, {"key": "39995133", "model": "llama", "target_model": "human", "recognition_score": 0.9893474892918867, "ground_truth": 0}, {"key": "39995133", "model": "llama", "target_model": "claude", "recognition_score": 0.9748211623571097, "ground_truth": 0}, {"key": "39995133", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9504109792231669, "ground_truth": 0}, {"key": "39995133", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9273632943642123, "ground_truth": 0}, {"key": "40249088", "model": "llama", "target_model": "llama", "recognition_score": 0.8152324945772025, "ground_truth": 1}, {"key": "40249088", "model": "llama", "target_model": "human", "recognition_score": 0.9284087910549143, "ground_truth": 0}, {"key": "40249088", "model": "llama", "target_model": "claude", "recognition_score": 0.7662936311184637, "ground_truth": 0}, {"key": "40249088", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8705972560631147, "ground_truth": 0}, {"key": "40249088", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9092645143530255, "ground_truth": 0}, {"key": "40254388", "model": "llama", "target_model": "llama", "recognition_score": 0.6352224543285102, "ground_truth": 1}, {"key": "40254388", "model": "llama", "target_model": "human", "recognition_score": 0.7690802476148619, "ground_truth": 0}, {"key": "40254388", "model": "llama", "target_model": "claude", "recognition_score": 0.6001883798854765, "ground_truth": 0}, {"key": "40254388", "model": "llama", "target_model": "gpt4", "recognition_score": 0.806852629075797, "ground_truth": 0}, {"key": "40254388", "model": "llama", "target_model": "gpt35", "recognition_score": 0.763483767186921, "ground_truth": 0}, {"key": "31995230", "model": "llama", "target_model": "llama", "recognition_score": 0.9005297892853887, "ground_truth": 1}, {"key": "31995230", "model": "llama", "target_model": "human", "recognition_score": 0.8311430415742063, "ground_truth": 0}, {"key": "31995230", "model": "llama", "target_model": "claude", "recognition_score": 0.932453317134429, "ground_truth": 0}, {"key": "31995230", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9059898134601283, "ground_truth": 0}, {"key": "31995230", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9600626848826118, "ground_truth": 0}, {"key": "38632129", "model": "llama", "target_model": "llama", "recognition_score": 0.9241418274800437, "ground_truth": 1}, {"key": "38632129", "model": "llama", "target_model": "human", "recognition_score": 0.9329437156886874, "ground_truth": 0}, {"key": "38632129", "model": "llama", "target_model": "claude", "recognition_score": 0.9118099596821886, "ground_truth": 0}, {"key": "38632129", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7839884735235795, "ground_truth": 0}, {"key": "38632129", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7879311953709953, "ground_truth": 0}, {"key": "35720795", "model": "llama", "target_model": "llama", "recognition_score": 0.8807970727522925, "ground_truth": 1}, {"key": "35720795", "model": "llama", "target_model": "human", "recognition_score": 0.8558511461111008, "ground_truth": 0}, {"key": "35720795", "model": "llama", "target_model": "claude", "recognition_score": 0.7090191115778279, "ground_truth": 0}, {"key": "35720795", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9161096092128659, "ground_truth": 0}, {"key": "35720795", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8278281420063239, "ground_truth": 0}, {"key": "23906759", "model": "llama", "target_model": "llama", "recognition_score": 0.7853085966869923, "ground_truth": 1}, {"key": "23906759", "model": "llama", "target_model": "human", "recognition_score": 0.9142907250020599, "ground_truth": 0}, {"key": "23906759", "model": "llama", "target_model": "claude", "recognition_score": 0.9213576161934132, "ground_truth": 0}, {"key": "23906759", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8910549414089921, "ground_truth": 0}, {"key": "23906759", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9184802458906933, "ground_truth": 0}, {"key": "19410108", "model": "llama", "target_model": "llama", "recognition_score": 0.73105857054311, "ground_truth": 1}, {"key": "19410108", "model": "llama", "target_model": "human", "recognition_score": 0.9039745127271186, "ground_truth": 0}, {"key": "19410108", "model": "llama", "target_model": "claude", "recognition_score": 0.8221891345107742, "ground_truth": 0}, {"key": "19410108", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8267117962831063, "ground_truth": 0}, {"key": "19410108", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8031738004583017, "ground_truth": 0}, {"key": "30745137", "model": "llama", "target_model": "llama", "recognition_score": 0.6406358483476934, "ground_truth": 1}, {"key": "30745137", "model": "llama", "target_model": "human", "recognition_score": 0.6095241616419624, "ground_truth": 0}, {"key": "30745137", "model": "llama", "target_model": "claude", "recognition_score": 0.775944531163814, "ground_truth": 0}, {"key": "30745137", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6671476914988302, "ground_truth": 0}, {"key": "30745137", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7759445504920454, "ground_truth": 0}, {"key": "26553115", "model": "llama", "target_model": "llama", "recognition_score": 0.720171514482537, "ground_truth": 1}, {"key": "26553115", "model": "llama", "target_model": "human", "recognition_score": 0.37387584416577935, "ground_truth": 0}, {"key": "26553115", "model": "llama", "target_model": "claude", "recognition_score": 0.45907614799892876, "ground_truth": 0}, {"key": "26553115", "model": "llama", "target_model": "gpt4", "recognition_score": 0.607663164818489, "ground_truth": 0}, {"key": "26553115", "model": "llama", "target_model": "gpt35", "recognition_score": 0.2845760128528521, "ground_truth": 0}, {"key": "37872311", "model": "llama", "target_model": "llama", "recognition_score": 0.8895288441301566, "ground_truth": 1}, {"key": "37872311", "model": "llama", "target_model": "human", "recognition_score": 0.7279754343270048, "ground_truth": 0}, {"key": "37872311", "model": "llama", "target_model": "claude", "recognition_score": 0.9362850068829192, "ground_truth": 0}, {"key": "37872311", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9453993910496425, "ground_truth": 0}, {"key": "37872311", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9539660937171486, "ground_truth": 0}, {"key": "35553131", "model": "llama", "target_model": "llama", "recognition_score": 0.8714748618184109, "ground_truth": 1}, {"key": "35553131", "model": "llama", "target_model": "human", "recognition_score": 0.9339146153115292, "ground_truth": 0}, {"key": "35553131", "model": "llama", "target_model": "claude", "recognition_score": 0.9394706106545971, "ground_truth": 0}, {"key": "35553131", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8255897051155201, "ground_truth": 0}, {"key": "35553131", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9124361611043807, "ground_truth": 0}, {"key": "39038936", "model": "llama", "target_model": "llama", "recognition_score": 0.832236666391838, "ground_truth": 1}, {"key": "39038936", "model": "llama", "target_model": "human", "recognition_score": 0.940789747540513, "ground_truth": 0}, {"key": "39038936", "model": "llama", "target_model": "claude", "recognition_score": 0.7676898475874114, "ground_truth": 0}, {"key": "39038936", "model": "llama", "target_model": "gpt4", "recognition_score": 0.795658105355842, "ground_truth": 0}, {"key": "39038936", "model": "llama", "target_model": "gpt35", "recognition_score": 0.747615957753758, "ground_truth": 0}, {"key": "38735486", "model": "llama", "target_model": "llama", "recognition_score": 0.9842154384774277, "ground_truth": 1}, {"key": "38735486", "model": "llama", "target_model": "human", "recognition_score": 0.9878528290151694, "ground_truth": 0}, {"key": "38735486", "model": "llama", "target_model": "claude", "recognition_score": 0.9559813491626391, "ground_truth": 0}, {"key": "38735486", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9759464486653707, "ground_truth": 0}, {"key": "38735486", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9832145077914518, "ground_truth": 0}, {"key": "17087845", "model": "llama", "target_model": "llama", "recognition_score": 0.7233094701578283, "ground_truth": 1}, {"key": "17087845", "model": "llama", "target_model": "human", "recognition_score": 0.5409238786645281, "ground_truth": 0}, {"key": "17087845", "model": "llama", "target_model": "claude", "recognition_score": 0.6926419882174533, "ground_truth": 0}, {"key": "17087845", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7620701211351654, "ground_truth": 0}, {"key": "17087845", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5698526503766846, "ground_truth": 0}, {"key": "37443011", "model": "llama", "target_model": "llama", "recognition_score": 0.86060362226077, "ground_truth": 1}, {"key": "37443011", "model": "llama", "target_model": "human", "recognition_score": 0.8221891273613726, "ground_truth": 0}, {"key": "37443011", "model": "llama", "target_model": "claude", "recognition_score": 0.8210441027415096, "ground_truth": 0}, {"key": "37443011", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8925625258945021, "ground_truth": 0}, {"key": "37443011", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7634837673201125, "ground_truth": 0}, {"key": "36855749", "model": "llama", "target_model": "llama", "recognition_score": 0.8289388117232711, "ground_truth": 1}, {"key": "36855749", "model": "llama", "target_model": "human", "recognition_score": 0.9324533162961381, "ground_truth": 0}, {"key": "36855749", "model": "llama", "target_model": "claude", "recognition_score": 0.8969755677195733, "ground_truth": 0}, {"key": "36855749", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9184802448024387, "ground_truth": 0}, {"key": "36855749", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8887587989640714, "ground_truth": 0}, {"key": "35613141", "model": "llama", "target_model": "llama", "recognition_score": 0.8548846385853415, "ground_truth": 1}, {"key": "35613141", "model": "llama", "target_model": "human", "recognition_score": 0.906653115621598, "ground_truth": 0}, {"key": "35613141", "model": "llama", "target_model": "claude", "recognition_score": 0.926303734935637, "ground_truth": 0}, {"key": "35613141", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7446563542619703, "ground_truth": 0}, {"key": "35613141", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9241418211324498, "ground_truth": 0}, {"key": "39088847", "model": "llama", "target_model": "llama", "recognition_score": 0.4804786764272868, "ground_truth": 1}, {"key": "39088847", "model": "llama", "target_model": "human", "recognition_score": 0.5312093487887517, "ground_truth": 0}, {"key": "39088847", "model": "llama", "target_model": "claude", "recognition_score": 0.5525397149058036, "ground_truth": 0}, {"key": "39088847", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4186969161131812, "ground_truth": 0}, {"key": "39088847", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4649015511087203, "ground_truth": 0}, {"key": "33197277", "model": "llama", "target_model": "llama", "recognition_score": 0.7786493061964127, "ground_truth": 1}, {"key": "33197277", "model": "llama", "target_model": "human", "recognition_score": 0.9473810460985035, "ground_truth": 0}, {"key": "33197277", "model": "llama", "target_model": "claude", "recognition_score": 0.959762051431905, "ground_truth": 0}, {"key": "33197277", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8991213805775271, "ground_truth": 0}, {"key": "33197277", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8376199482581527, "ground_truth": 0}, {"key": "33815489", "model": "llama", "target_model": "llama", "recognition_score": 0.7025300561839394, "ground_truth": 1}, {"key": "33815489", "model": "llama", "target_model": "human", "recognition_score": 0.7371581698464007, "ground_truth": 0}, {"key": "33815489", "model": "llama", "target_model": "claude", "recognition_score": 0.7122321816180069, "ground_truth": 0}, {"key": "33815489", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6943026892670509, "ground_truth": 0}, {"key": "33815489", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7620701311996606, "ground_truth": 0}, {"key": "35862754", "model": "llama", "target_model": "llama", "recognition_score": 0.9235923186991768, "ground_truth": 1}, {"key": "35862754", "model": "llama", "target_model": "human", "recognition_score": 0.854884650351415, "ground_truth": 0}, {"key": "35862754", "model": "llama", "target_model": "claude", "recognition_score": 0.8679338434204354, "ground_truth": 0}, {"key": "35862754", "model": "llama", "target_model": "gpt4", "recognition_score": 0.909264511455575, "ground_truth": 0}, {"key": "35862754", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8962513610006182, "ground_truth": 0}, {"key": "36080615", "model": "llama", "target_model": "llama", "recognition_score": 0.6370307835351718, "ground_truth": 1}, {"key": "36080615", "model": "llama", "target_model": "human", "recognition_score": 0.511716588480447, "ground_truth": 0}, {"key": "36080615", "model": "llama", "target_model": "claude", "recognition_score": 0.7476159477543152, "ground_truth": 0}, {"key": "36080615", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7106283063944221, "ground_truth": 0}, {"key": "36080615", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6654105552044554, "ground_truth": 0}, {"key": "22822742", "model": "llama", "target_model": "llama", "recognition_score": 0.8832359685452742, "ground_truth": 1}, {"key": "22822742", "model": "llama", "target_model": "human", "recognition_score": 0.9539661021241541, "ground_truth": 0}, {"key": "22822742", "model": "llama", "target_model": "claude", "recognition_score": 0.9653811631360629, "ground_truth": 0}, {"key": "22822742", "model": "llama", "target_model": "gpt4", "recognition_score": 0.938124015778431, "ground_truth": 0}, {"key": "22822742", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9529258304970667, "ground_truth": 0}, {"key": "39747536", "model": "llama", "target_model": "llama", "recognition_score": 0.8365545575854607, "ground_truth": 1}, {"key": "39747536", "model": "llama", "target_model": "human", "recognition_score": 0.8164063822971395, "ground_truth": 0}, {"key": "39747536", "model": "llama", "target_model": "claude", "recognition_score": 0.7431680008031495, "ground_truth": 0}, {"key": "39747536", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7185943962104947, "ground_truth": 0}, {"key": "39747536", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7106282963813769, "ground_truth": 0}, {"key": "34218396", "model": "llama", "target_model": "llama", "recognition_score": 0.9394706150579042, "ground_truth": 1}, {"key": "34218396", "model": "llama", "target_model": "human", "recognition_score": 0.9032942048736549, "ground_truth": 0}, {"key": "34218396", "model": "llama", "target_model": "claude", "recognition_score": 0.9412234479130076, "ground_truth": 0}, {"key": "34218396", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8824278602592411, "ground_truth": 0}, {"key": "34218396", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8652240871323181, "ground_truth": 0}, {"key": "39150388", "model": "llama", "target_model": "llama", "recognition_score": 0.721743197073489, "ground_truth": 1}, {"key": "39150388", "model": "llama", "target_model": "human", "recognition_score": 0.6601723592782599, "ground_truth": 0}, {"key": "39150388", "model": "llama", "target_model": "claude", "recognition_score": 0.7476159449720453, "ground_truth": 0}, {"key": "39150388", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6671476725401702, "ground_truth": 0}, {"key": "39150388", "model": "llama", "target_model": "gpt35", "recognition_score": 0.38121957616765917, "ground_truth": 0}, {"key": "28765782", "model": "llama", "target_model": "llama", "recognition_score": 0.9046505360978506, "ground_truth": 1}, {"key": "28765782", "model": "llama", "target_model": "human", "recognition_score": 0.8848377733475293, "ground_truth": 0}, {"key": "28765782", "model": "llama", "target_model": "claude", "recognition_score": 0.8918110488756955, "ground_truth": 0}, {"key": "28765782", "model": "llama", "target_model": "gpt4", "recognition_score": 0.941654155328735, "ground_truth": 0}, {"key": "28765782", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8529354836077669, "ground_truth": 0}, {"key": "35828022", "model": "llama", "target_model": "llama", "recognition_score": 0.775944548474918, "ground_truth": 1}, {"key": "35828022", "model": "llama", "target_model": "human", "recognition_score": 0.6566582583951269, "ground_truth": 0}, {"key": "35828022", "model": "llama", "target_model": "claude", "recognition_score": 0.7446563400897841, "ground_truth": 0}, {"key": "35828022", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6774740130026801, "ground_truth": 0}, {"key": "35828022", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8418256517679226, "ground_truth": 0}, {"key": "27717735", "model": "llama", "target_model": "llama", "recognition_score": 0.6169358292730457, "ground_truth": 1}, {"key": "27717735", "model": "llama", "target_model": "human", "recognition_score": 0.8210441003933896, "ground_truth": 0}, {"key": "27717735", "model": "llama", "target_model": "claude", "recognition_score": 0.5964331464018664, "ground_truth": 0}, {"key": "27717735", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7826624836399292, "ground_truth": 0}, {"key": "27717735", "model": "llama", "target_model": "gpt35", "recognition_score": 0.756357595003137, "ground_truth": 0}, {"key": "37977826", "model": "llama", "target_model": "llama", "recognition_score": 0.8056321755649624, "ground_truth": 1}, {"key": "37977826", "model": "llama", "target_model": "human", "recognition_score": 0.6169358465779419, "ground_truth": 0}, {"key": "37977826", "model": "llama", "target_model": "claude", "recognition_score": 0.7879311867341514, "ground_truth": 0}, {"key": "37977826", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7401743740824347, "ground_truth": 0}, {"key": "37977826", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7563575677388518, "ground_truth": 0}, {"key": "31768588", "model": "llama", "target_model": "llama", "recognition_score": 0.9556514181345047, "ground_truth": 1}, {"key": "31768588", "model": "llama", "target_model": "human", "recognition_score": 0.9840936100283483, "ground_truth": 0}, {"key": "31768588", "model": "llama", "target_model": "claude", "recognition_score": 0.9609517132417398, "ground_truth": 0}, {"key": "31768588", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9012274140589353, "ground_truth": 0}, {"key": "31768588", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9213576247608177, "ground_truth": 0}, {"key": "37183351", "model": "llama", "target_model": "llama", "recognition_score": 0.6039318317502324, "ground_truth": 1}, {"key": "37183351", "model": "llama", "target_model": "human", "recognition_score": 0.36658977313688706, "ground_truth": 0}, {"key": "37183351", "model": "llama", "target_model": "claude", "recognition_score": 0.5794003985103615, "ground_truth": 0}, {"key": "37183351", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5888891214680222, "ground_truth": 0}, {"key": "37183351", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5926666235564906, "ground_truth": 0}, {"key": "39622090", "model": "llama", "target_model": "llama", "recognition_score": 0.6406358433268612, "ground_truth": 1}, {"key": "39622090", "model": "llama", "target_model": "human", "recognition_score": 0.5136684716526089, "ground_truth": 0}, {"key": "39622090", "model": "llama", "target_model": "claude", "recognition_score": 0.6859494358859419, "ground_truth": 0}, {"key": "39622090", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5621764893194331, "ground_truth": 0}, {"key": "39622090", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3611647241346406, "ground_truth": 0}, {"key": "39272756", "model": "llama", "target_model": "llama", "recognition_score": 0.8006920129254592, "ground_truth": 1}, {"key": "39272756", "model": "llama", "target_model": "human", "recognition_score": 0.6976088954451767, "ground_truth": 0}, {"key": "39272756", "model": "llama", "target_model": "claude", "recognition_score": 0.6242935571977298, "ground_truth": 0}, {"key": "39272756", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7839884646127391, "ground_truth": 0}, {"key": "39272756", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7563575670287912, "ground_truth": 0}, {"key": "32138822", "model": "llama", "target_model": "llama", "recognition_score": 0.8539127562482608, "ground_truth": 1}, {"key": "32138822", "model": "llama", "target_model": "human", "recognition_score": 0.8499711721013041, "ground_truth": 0}, {"key": "32138822", "model": "llama", "target_model": "claude", "recognition_score": 0.80317376522601, "ground_truth": 0}, {"key": "32138822", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9304582568574752, "ground_truth": 0}, {"key": "32138822", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8848377724664024, "ground_truth": 0}, {"key": "31070114", "model": "llama", "target_model": "llama", "recognition_score": 0.27048020703441134, "ground_truth": 1}, {"key": "31070114", "model": "llama", "target_model": "human", "recognition_score": 0.18476752186083129, "ground_truth": 0}, {"key": "31070114", "model": "llama", "target_model": "claude", "recognition_score": 0.28776780972416915, "ground_truth": 0}, {"key": "31070114", "model": "llama", "target_model": "gpt4", "recognition_score": 0.2094696800639735, "ground_truth": 0}, {"key": "31070114", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4111108740514996, "ground_truth": 0}, {"key": "39652762", "model": "llama", "target_model": "llama", "recognition_score": 0.9621075778400537, "ground_truth": 1}, {"key": "39652762", "model": "llama", "target_model": "human", "recognition_score": 0.9273632959207371, "ground_truth": 0}, {"key": "39652762", "model": "llama", "target_model": "claude", "recognition_score": 0.8955226835996741, "ground_truth": 0}, {"key": "39652762", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8175744649022332, "ground_truth": 0}, {"key": "39652762", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8740772300547658, "ground_truth": 0}, {"key": "33258866", "model": "llama", "target_model": "llama", "recognition_score": 0.6113819895740856, "ground_truth": 1}, {"key": "33258866", "model": "llama", "target_model": "human", "recognition_score": 0.6992544300893859, "ground_truth": 0}, {"key": "33258866", "model": "llama", "target_model": "claude", "recognition_score": 0.5350984407870788, "ground_truth": 0}, {"key": "33258866", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5448013677145181, "ground_truth": 0}, {"key": "33258866", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5983121732297216, "ground_truth": 0}, {"key": "36962388", "model": "llama", "target_model": "llama", "recognition_score": 0.8766343842902586, "ground_truth": 1}, {"key": "36962388", "model": "llama", "target_model": "human", "recognition_score": 0.7248702878622553, "ground_truth": 0}, {"key": "36962388", "model": "llama", "target_model": "claude", "recognition_score": 0.8152324899213406, "ground_truth": 0}, {"key": "36962388", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7981867838574047, "ground_truth": 0}, {"key": "36962388", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8438951155351945, "ground_truth": 0}, {"key": "32282272", "model": "llama", "target_model": "llama", "recognition_score": 0.5136684875614546, "ground_truth": 1}, {"key": "32282272", "model": "llama", "target_model": "human", "recognition_score": 0.4339814589618265, "ground_truth": 0}, {"key": "32282272", "model": "llama", "target_model": "claude", "recognition_score": 0.6150878743632647, "ground_truth": 0}, {"key": "32282272", "model": "llama", "target_model": "gpt4", "recognition_score": 0.36116470470994666, "ground_truth": 0}, {"key": "32282272", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5292633887201129, "ground_truth": 0}, {"key": "36093072", "model": "llama", "target_model": "llama", "recognition_score": 0.9453993949325364, "ground_truth": 1}, {"key": "36093072", "model": "llama", "target_model": "human", "recognition_score": 0.9518632288166011, "ground_truth": 0}, {"key": "36093072", "model": "llama", "target_model": "claude", "recognition_score": 0.9079671317257538, "ground_truth": 0}, {"key": "36093072", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9539660931380382, "ground_truth": 0}, {"key": "36093072", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9445872074783254, "ground_truth": 0}, {"key": "38879972", "model": "llama", "target_model": "llama", "recognition_score": 0.7718435044090839, "ground_truth": 1}, {"key": "38879972", "model": "llama", "target_model": "human", "recognition_score": 0.754914978576768, "ground_truth": 0}, {"key": "38879972", "model": "llama", "target_model": "claude", "recognition_score": 0.6636689352455912, "ground_truth": 0}, {"key": "38879972", "model": "llama", "target_model": "gpt4", "recognition_score": 0.859663765051116, "ground_truth": 0}, {"key": "38879972", "model": "llama", "target_model": "gpt35", "recognition_score": 0.70416014694587, "ground_truth": 0}, {"key": "32106473", "model": "llama", "target_model": "llama", "recognition_score": 0.7122321850058974, "ground_truth": 1}, {"key": "32106473", "model": "llama", "target_model": "human", "recognition_score": 0.7185943916281122, "ground_truth": 0}, {"key": "32106473", "model": "llama", "target_model": "claude", "recognition_score": 0.8092759651392868, "ground_truth": 0}, {"key": "32106473", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8438951054385039, "ground_truth": 0}, {"key": "32106473", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7592253913990736, "ground_truth": 0}, {"key": "40415815", "model": "llama", "target_model": "llama", "recognition_score": 0.7295197734886439, "ground_truth": 1}, {"key": "40415815", "model": "llama", "target_model": "human", "recognition_score": 0.6388352786052836, "ground_truth": 0}, {"key": "40415815", "model": "llama", "target_model": "claude", "recognition_score": 0.5832033312319295, "ground_truth": 0}, {"key": "40415815", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4726834623497772, "ground_truth": 0}, {"key": "40415815", "model": "llama", "target_model": "gpt35", "recognition_score": 0.515619912920672, "ground_truth": 0}, {"key": "34581918", "model": "llama", "target_model": "llama", "recognition_score": 0.7325918301503095, "ground_truth": 1}, {"key": "34581918", "model": "llama", "target_model": "human", "recognition_score": 0.7431680179367717, "ground_truth": 0}, {"key": "34581918", "model": "llama", "target_model": "claude", "recognition_score": 0.7057850182109892, "ground_truth": 0}, {"key": "34581918", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7892336825622477, "ground_truth": 0}, {"key": "34581918", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8056321785881022, "ground_truth": 0}, {"key": "33004157", "model": "llama", "target_model": "llama", "recognition_score": 0.9343951680253969, "ground_truth": 1}, {"key": "33004157", "model": "llama", "target_model": "human", "recognition_score": 0.8289388226430914, "ground_truth": 0}, {"key": "33004157", "model": "llama", "target_model": "claude", "recognition_score": 0.8856314754271695, "ground_truth": 0}, {"key": "33004157", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8791467706751563, "ground_truth": 0}, {"key": "33004157", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9173026547426414, "ground_truth": 0}, {"key": "30334943", "model": "llama", "target_model": "llama", "recognition_score": 0.943763651285544, "ground_truth": 1}, {"key": "30334943", "model": "llama", "target_model": "human", "recognition_score": 0.9130583422486149, "ground_truth": 0}, {"key": "30334943", "model": "llama", "target_model": "claude", "recognition_score": 0.8519527913104884, "ground_truth": 0}, {"key": "30334943", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8152324757822316, "ground_truth": 0}, {"key": "30334943", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8643104703097341, "ground_truth": 0}, {"key": "33280503", "model": "llama", "target_model": "llama", "recognition_score": 0.39981163099527606, "ground_truth": 1}, {"key": "33280503", "model": "llama", "target_model": "human", "recognition_score": 0.46684559894414307, "ground_truth": 0}, {"key": "33280503", "model": "llama", "target_model": "claude", "recognition_score": 0.45519861372552906, "ground_truth": 0}, {"key": "33280503", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3575675155059613, "ground_truth": 0}, {"key": "33280503", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4263215913599255, "ground_truth": 0}, {"key": "25726782", "model": "llama", "target_model": "llama", "recognition_score": 0.9462003523650279, "ground_truth": 1}, {"key": "25726782", "model": "llama", "target_model": "human", "recognition_score": 0.8529354937455348, "ground_truth": 0}, {"key": "25726782", "model": "llama", "target_model": "claude", "recognition_score": 0.9492946387026931, "ground_truth": 0}, {"key": "25726782", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9473810472771896, "ground_truth": 0}, {"key": "25726782", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9394706059710781, "ground_truth": 0}, {"key": "35479854", "model": "llama", "target_model": "llama", "recognition_score": 0.7057850248898029, "ground_truth": 1}, {"key": "35479854", "model": "llama", "target_model": "human", "recognition_score": 0.6548947303385635, "ground_truth": 0}, {"key": "35479854", "model": "llama", "target_model": "claude", "recognition_score": 0.7853085937309383, "ground_truth": 0}, {"key": "35479854", "model": "llama", "target_model": "gpt4", "recognition_score": 0.902609599669235, "ground_truth": 0}, {"key": "35479854", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7943849512304731, "ground_truth": 0}, {"key": "32716226", "model": "llama", "target_model": "llama", "recognition_score": 0.6740504735927563, "ground_truth": 1}, {"key": "32716226", "model": "llama", "target_model": "human", "recognition_score": 0.8278281504237683, "ground_truth": 0}, {"key": "32716226", "model": "llama", "target_model": "claude", "recognition_score": 0.7549149918412571, "ground_truth": 0}, {"key": "32716226", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7217432423318012, "ground_truth": 0}, {"key": "32716226", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8652240766744832, "ground_truth": 0}, {"key": "37047554", "model": "llama", "target_model": "llama", "recognition_score": 0.46101679382394933, "ground_truth": 1}, {"key": "37047554", "model": "llama", "target_model": "human", "recognition_score": 0.5736784047970279, "ground_truth": 0}, {"key": "37047554", "model": "llama", "target_model": "claude", "recognition_score": 0.8376199683854145, "ground_truth": 0}, {"key": "37047554", "model": "llama", "target_model": "gpt4", "recognition_score": 0.30902370088525477, "ground_truth": 0}, {"key": "37047554", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7386690626227167, "ground_truth": 0}, {"key": "36565290", "model": "llama", "target_model": "llama", "recognition_score": 0.9309620650080223, "ground_truth": 1}, {"key": "36565290", "model": "llama", "target_model": "human", "recognition_score": 0.9420819168165858, "ground_truth": 0}, {"key": "36565290", "model": "llama", "target_model": "claude", "recognition_score": 0.9563089406384733, "ground_truth": 0}, {"key": "36565290", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9394706139933143, "ground_truth": 0}, {"key": "36565290", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9507778860910188, "ground_truth": 0}, {"key": "27758640", "model": "llama", "target_model": "llama", "recognition_score": 0.831143056018379, "ground_truth": 1}, {"key": "27758640", "model": "llama", "target_model": "human", "recognition_score": 0.7732163664272538, "ground_truth": 0}, {"key": "27758640", "model": "llama", "target_model": "claude", "recognition_score": 0.9433475784258756, "ground_truth": 0}, {"key": "27758640", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8221891353738253, "ground_truth": 0}, {"key": "27758640", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8714748595892743, "ground_truth": 0}, {"key": "28897118", "model": "llama", "target_model": "llama", "recognition_score": 0.6113819567059016, "ground_truth": 1}, {"key": "28897118", "model": "llama", "target_model": "human", "recognition_score": 0.7401743501449426, "ground_truth": 0}, {"key": "28897118", "model": "llama", "target_model": "claude", "recognition_score": 0.7905303240874934, "ground_truth": 0}, {"key": "28897118", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7813306041198287, "ground_truth": 0}, {"key": "28897118", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5813031025800955, "ground_truth": 0}, {"key": "38452661", "model": "llama", "target_model": "llama", "recognition_score": 0.9606574980272221, "ground_truth": 1}, {"key": "38452661", "model": "llama", "target_model": "human", "recognition_score": 0.9539660930167296, "ground_truth": 0}, {"key": "38452661", "model": "llama", "target_model": "claude", "recognition_score": 0.9314625049059772, "ground_truth": 0}, {"key": "38452661", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8210441177297131, "ground_truth": 0}, {"key": "38452661", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8596637737316477, "ground_truth": 0}, {"key": "38033492", "model": "llama", "target_model": "llama", "recognition_score": 0.8697145817191203, "ground_truth": 1}, {"key": "38033492", "model": "llama", "target_model": "human", "recognition_score": 0.8652240836944379, "ground_truth": 0}, {"key": "38033492", "model": "llama", "target_model": "claude", "recognition_score": 0.9257686364453296, "ground_truth": 0}, {"key": "38033492", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8152324959572732, "ground_truth": 0}, {"key": "38033492", "model": "llama", "target_model": "gpt35", "recognition_score": 0.931959577450012, "ground_truth": 0}, {"key": "35949555", "model": "llama", "target_model": "llama", "recognition_score": 0.9358173586513846, "ground_truth": 1}, {"key": "35949555", "model": "llama", "target_model": "human", "recognition_score": 0.9314625036773213, "ground_truth": 0}, {"key": "35949555", "model": "llama", "target_model": "claude", "recognition_score": 0.9437636558030084, "ground_truth": 0}, {"key": "35949555", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8984105577483521, "ground_truth": 0}, {"key": "35949555", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9367494785227867, "ground_truth": 0}, {"key": "15263826", "model": "llama", "target_model": "llama", "recognition_score": 0.687630034591785, "ground_truth": 1}, {"key": "15263826", "model": "llama", "target_model": "human", "recognition_score": 0.4205995539301398, "ground_truth": 0}, {"key": "15263826", "model": "llama", "target_model": "claude", "recognition_score": 0.7138307676606868, "ground_truth": 0}, {"key": "15263826", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6442251093074998, "ground_truth": 0}, {"key": "15263826", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6076631561544975, "ground_truth": 0}, {"key": "37313866", "model": "llama", "target_model": "llama", "recognition_score": 0.9314625049586609, "ground_truth": 1}, {"key": "37313866", "model": "llama", "target_model": "human", "recognition_score": 0.6477982499363165, "ground_truth": 0}, {"key": "37313866", "model": "llama", "target_model": "claude", "recognition_score": 0.8092759898094904, "ground_truth": 0}, {"key": "37313866", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7994423172931346, "ground_truth": 0}, {"key": "37313866", "model": "llama", "target_model": "gpt35", "recognition_score": 0.750552756413976, "ground_truth": 0}, {"key": "13911157", "model": "llama", "target_model": "llama", "recognition_score": 0.9518632286389433, "ground_truth": 1}, {"key": "13911157", "model": "llama", "target_model": "human", "recognition_score": 0.9885803865865599, "ground_truth": 0}, {"key": "13911157", "model": "llama", "target_model": "claude", "recognition_score": 0.967410255638733, "ground_truth": 0}, {"key": "13911157", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9683812334034856, "ground_truth": 0}, {"key": "13911157", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9575961717164774, "ground_truth": 0}, {"key": "39594894", "model": "llama", "target_model": "llama", "recognition_score": 0.7154239918482526, "ground_truth": 1}, {"key": "39594894", "model": "llama", "target_model": "human", "recognition_score": 0.8386797629215896, "ground_truth": 0}, {"key": "39594894", "model": "llama", "target_model": "claude", "recognition_score": 0.45132650125591134, "ground_truth": 0}, {"key": "39594894", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8116760184245899, "ground_truth": 0}, {"key": "39594894", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8198933539128385, "ground_truth": 0}, {"key": "34096170", "model": "llama", "target_model": "llama", "recognition_score": 0.9039745180296166, "ground_truth": 1}, {"key": "34096170", "model": "llama", "target_model": "human", "recognition_score": 0.8962513704350676, "ground_truth": 0}, {"key": "34096170", "model": "llama", "target_model": "claude", "recognition_score": 0.9263037316295913, "ground_truth": 0}, {"key": "34096170", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7662936465008293, "ground_truth": 0}, {"key": "34096170", "model": "llama", "target_model": "gpt35", "recognition_score": 0.85096471300778, "ground_truth": 0}, {"key": "37891952", "model": "llama", "target_model": "llama", "recognition_score": 0.9887554394533702, "ground_truth": 1}, {"key": "37891952", "model": "llama", "target_model": "human", "recognition_score": 0.9910838730469732, "ground_truth": 0}, {"key": "37891952", "model": "llama", "target_model": "claude", "recognition_score": 0.9933588883605159, "ground_truth": 0}, {"key": "37891952", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9862576800029408, "ground_truth": 0}, {"key": "37891952", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9929882052155007, "ground_truth": 0}, {"key": "40186158", "model": "llama", "target_model": "llama", "recognition_score": 0.741674013577275, "ground_truth": 1}, {"key": "40186158", "model": "llama", "target_model": "human", "recognition_score": 0.631594311255293, "ground_truth": 0}, {"key": "40186158", "model": "llama", "target_model": "claude", "recognition_score": 0.7563575699321177, "ground_truth": 0}, {"key": "40186158", "model": "llama", "target_model": "gpt4", "recognition_score": 0.575588038438418, "ground_truth": 0}, {"key": "40186158", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6242935058241209, "ground_truth": 0}, {"key": "37049719", "model": "llama", "target_model": "llama", "recognition_score": 0.8757869759121353, "ground_truth": 1}, {"key": "37049719", "model": "llama", "target_model": "human", "recognition_score": 0.7759445468200813, "ground_truth": 0}, {"key": "37049719", "model": "llama", "target_model": "claude", "recognition_score": 0.8643104594250898, "ground_truth": 0}, {"key": "37049719", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7826624708983909, "ground_truth": 0}, {"key": "37049719", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6808786189335568, "ground_truth": 0}, {"key": "34610504", "model": "llama", "target_model": "llama", "recognition_score": 0.9213576199100706, "ground_truth": 1}, {"key": "34610504", "model": "llama", "target_model": "human", "recognition_score": 0.8210441105185272, "ground_truth": 0}, {"key": "34610504", "model": "llama", "target_model": "claude", "recognition_score": 0.8019358201698863, "ground_truth": 0}, {"key": "34610504", "model": "llama", "target_model": "gpt4", "recognition_score": 0.868826778864861, "ground_truth": 0}, {"key": "34610504", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8407825787564395, "ground_truth": 0}, {"key": "37595429", "model": "llama", "target_model": "llama", "recognition_score": 0.9099069959957508, "ground_truth": 1}, {"key": "37595429", "model": "llama", "target_model": "human", "recognition_score": 0.8386797428592045, "ground_truth": 0}, {"key": "37595429", "model": "llama", "target_model": "claude", "recognition_score": 0.8322366627841362, "ground_truth": 0}, {"key": "37595429", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8469578221440398, "ground_truth": 0}, {"key": "37595429", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7676898612418698, "ground_truth": 0}, {"key": "29772670", "model": "llama", "target_model": "llama", "recognition_score": 0.3090237129983168, "ground_truth": 1}, {"key": "29772670", "model": "llama", "target_model": "human", "recognition_score": 0.5851011586741326, "ground_truth": 0}, {"key": "29772670", "model": "llama", "target_model": "claude", "recognition_score": 0.7041601398161667, "ground_truth": 0}, {"key": "29772670", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6859494478833743, "ground_truth": 0}, {"key": "29772670", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5926665762805445, "ground_truth": 0}, {"key": "36369872", "model": "llama", "target_model": "llama", "recognition_score": 0.8947894695116354, "ground_truth": 1}, {"key": "36369872", "model": "llama", "target_model": "human", "recognition_score": 0.602061592084887, "ground_truth": 0}, {"key": "36369872", "model": "llama", "target_model": "claude", "recognition_score": 0.7505527472292995, "ground_truth": 0}, {"key": "36369872", "model": "llama", "target_model": "gpt4", "recognition_score": 0.79310596962297, "ground_truth": 0}, {"key": "36369872", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8661325158366335, "ground_truth": 0}, {"key": "34527433", "model": "llama", "target_model": "llama", "recognition_score": 0.6477981944234243, "ground_truth": 1}, {"key": "34527433", "model": "llama", "target_model": "human", "recognition_score": 0.5506073572494956, "ground_truth": 0}, {"key": "34527433", "model": "llama", "target_model": "claude", "recognition_score": 0.5350984358761965, "ground_truth": 0}, {"key": "34527433", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5117165756436627, "ground_truth": 0}, {"key": "34527433", "model": "llama", "target_model": "gpt35", "recognition_score": 0.620621625400053, "ground_truth": 0}, {"key": "31111734", "model": "llama", "target_model": "llama", "recognition_score": 0.8902942308525186, "ground_truth": 1}, {"key": "31111734", "model": "llama", "target_model": "human", "recognition_score": 0.808067211234663, "ground_truth": 0}, {"key": "31111734", "model": "llama", "target_model": "claude", "recognition_score": 0.8577681044438297, "ground_truth": 0}, {"key": "31111734", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8596637407443355, "ground_truth": 0}, {"key": "31111734", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8991213830612287, "ground_truth": 0}, {"key": "40303872", "model": "llama", "target_model": "llama", "recognition_score": 0.8732148221072568, "ground_truth": 1}, {"key": "40303872", "model": "llama", "target_model": "human", "recognition_score": 0.8670357619827784, "ground_truth": 0}, {"key": "40303872", "model": "llama", "target_model": "claude", "recognition_score": 0.8783142561619005, "ground_truth": 0}, {"key": "40303872", "model": "llama", "target_model": "gpt4", "recognition_score": 0.85195278945854, "ground_truth": 0}, {"key": "40303872", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8354835335217059, "ground_truth": 0}, {"key": "33653553", "model": "llama", "target_model": "llama", "recognition_score": 0.5389832147331887, "ground_truth": 1}, {"key": "33653553", "model": "llama", "target_model": "human", "recognition_score": 0.5660185220352811, "ground_truth": 0}, {"key": "33653553", "model": "llama", "target_model": "claude", "recognition_score": 0.585101134585366, "ground_truth": 0}, {"key": "33653553", "model": "llama", "target_model": "gpt4", "recognition_score": 0.38491214648975036, "ground_truth": 0}, {"key": "33653553", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5563995940286272, "ground_truth": 0}, {"key": "34404510", "model": "llama", "target_model": "llama", "recognition_score": 0.7918210650105594, "ground_truth": 1}, {"key": "34404510", "model": "llama", "target_model": "human", "recognition_score": 0.7264256088895542, "ground_truth": 0}, {"key": "34404510", "model": "llama", "target_model": "claude", "recognition_score": 0.8289387865379505, "ground_truth": 0}, {"key": "34404510", "model": "llama", "target_model": "gpt4", "recognition_score": 0.890294219991533, "ground_truth": 0}, {"key": "34404510", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8428631575238646, "ground_truth": 0}, {"key": "35568692", "model": "llama", "target_model": "llama", "recognition_score": 0.24944723188980955, "ground_truth": 1}, {"key": "35568692", "model": "llama", "target_model": "human", "recognition_score": 0.20307464304174694, "ground_truth": 0}, {"key": "35568692", "model": "llama", "target_model": "claude", "recognition_score": 0.2845760046987381, "ground_truth": 0}, {"key": "35568692", "model": "llama", "target_model": "gpt4", "recognition_score": 0.2674081701478478, "ground_truth": 0}, {"key": "35568692", "model": "llama", "target_model": "gpt35", "recognition_score": 0.29259529131347095, "ground_truth": 0}, {"key": "39151664", "model": "llama", "target_model": "llama", "recognition_score": 0.35398626271208894, "ground_truth": 1}, {"key": "39151664", "model": "llama", "target_model": "human", "recognition_score": 0.44167299461887455, "ground_truth": 0}, {"key": "39151664", "model": "llama", "target_model": "claude", "recognition_score": 0.3702253640535171, "ground_truth": 0}, {"key": "39151664", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6460136934483768, "ground_truth": 0}, {"key": "39151664", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6150878325995497, "ground_truth": 0}, {"key": "37493670", "model": "llama", "target_model": "llama", "recognition_score": 0.9963783147944585, "ground_truth": 1}, {"key": "37493670", "model": "llama", "target_model": "human", "recognition_score": 0.9976218766613144, "ground_truth": 0}, {"key": "37493670", "model": "llama", "target_model": "claude", "recognition_score": 0.9939496023509267, "ground_truth": 0}, {"key": "37493670", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9951702778011291, "ground_truth": 0}, {"key": "37493670", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9957020615587087, "ground_truth": 0}, {"key": "21935983", "model": "llama", "target_model": "llama", "recognition_score": 0.5292633889358369, "ground_truth": 1}, {"key": "21935983", "model": "llama", "target_model": "human", "recognition_score": 0.4301473289163134, "ground_truth": 0}, {"key": "21935983", "model": "llama", "target_model": "claude", "recognition_score": 0.44939261895561766, "ground_truth": 0}, {"key": "21935983", "model": "llama", "target_model": "gpt4", "recognition_score": 0.29746994191203513, "ground_truth": 0}, {"key": "21935983", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4148988428410314, "ground_truth": 0}, {"key": "38174214", "model": "llama", "target_model": "llama", "recognition_score": 0.8449215261841566, "ground_truth": 1}, {"key": "38174214", "model": "llama", "target_model": "human", "recognition_score": 0.8925625213983575, "ground_truth": 0}, {"key": "38174214", "model": "llama", "target_model": "claude", "recognition_score": 0.8633916026495679, "ground_truth": 0}, {"key": "38174214", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9348724467756085, "ground_truth": 0}, {"key": "38174214", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8164063869642785, "ground_truth": 0}, {"key": "40319923", "model": "llama", "target_model": "llama", "recognition_score": 0.9241418124078083, "ground_truth": 1}, {"key": "40319923", "model": "llama", "target_model": "human", "recognition_score": 0.9775429482232838, "ground_truth": 0}, {"key": "40319923", "model": "llama", "target_model": "claude", "recognition_score": 0.9492946329633751, "ground_truth": 0}, {"key": "40319923", "model": "llama", "target_model": "gpt4", "recognition_score": 0.930962070979372, "ground_truth": 0}, {"key": "40319923", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9420819102354717, "ground_truth": 0}, {"key": "36478264", "model": "llama", "target_model": "llama", "recognition_score": 0.8418256481950809, "ground_truth": 1}, {"key": "36478264", "model": "llama", "target_model": "human", "recognition_score": 0.8140528185481248, "ground_truth": 0}, {"key": "36478264", "model": "llama", "target_model": "claude", "recognition_score": 0.884837756109288, "ground_truth": 0}, {"key": "36478264", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8449215398395616, "ground_truth": 0}, {"key": "36478264", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8529354931382107, "ground_truth": 0}, {"key": "11935769", "model": "llama", "target_model": "llama", "recognition_score": 0.7041601447057069, "ground_truth": 1}, {"key": "11935769", "model": "llama", "target_model": "human", "recognition_score": 0.7799928943982769, "ground_truth": 0}, {"key": "11935769", "model": "llama", "target_model": "claude", "recognition_score": 0.6706082621891185, "ground_truth": 0}, {"key": "11935769", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8365545564409925, "ground_truth": 0}, {"key": "11935769", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8459424475547205, "ground_truth": 0}, {"key": "33373410", "model": "llama", "target_model": "llama", "recognition_score": 0.4092207849846268, "ground_truth": 1}, {"key": "33373410", "model": "llama", "target_model": "human", "recognition_score": 0.3557748892220617, "ground_truth": 0}, {"key": "33373410", "model": "llama", "target_model": "claude", "recognition_score": 0.40922079329989725, "ground_truth": 0}, {"key": "33373410", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5039061521615258, "ground_truth": 0}, {"key": "33373410", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3684057174473725, "ground_truth": 0}, {"key": "11130680", "model": "llama", "target_model": "llama", "recognition_score": 0.8044059162260301, "ground_truth": 1}, {"key": "11130680", "model": "llama", "target_model": "human", "recognition_score": 0.9273632906473536, "ground_truth": 0}, {"key": "11130680", "model": "llama", "target_model": "claude", "recognition_score": 0.6242935310637857, "ground_truth": 0}, {"key": "11130680", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9343951624200579, "ground_truth": 0}, {"key": "11130680", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8615382092295867, "ground_truth": 0}, {"key": "34868650", "model": "llama", "target_model": "llama", "recognition_score": 0.8832359894048772, "ground_truth": 1}, {"key": "34868650", "model": "llama", "target_model": "human", "recognition_score": 0.6315943037030151, "ground_truth": 0}, {"key": "34868650", "model": "llama", "target_model": "claude", "recognition_score": 0.8596637580464385, "ground_truth": 0}, {"key": "34868650", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7577943756707582, "ground_truth": 0}, {"key": "34868650", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9124361580078967, "ground_truth": 0}, {"key": "33960561", "model": "llama", "target_model": "llama", "recognition_score": 0.7826624920720137, "ground_truth": 1}, {"key": "33960561", "model": "llama", "target_model": "human", "recognition_score": 0.5078118622413583, "ground_truth": 0}, {"key": "33960561", "model": "llama", "target_model": "claude", "recognition_score": 0.7386690793569918, "ground_truth": 0}, {"key": "33960561", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7732163727376337, "ground_truth": 0}, {"key": "33960561", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7786493368434696, "ground_truth": 0}, {"key": "22504858", "model": "llama", "target_model": "llama", "recognition_score": 0.7905302968149635, "ground_truth": 1}, {"key": "22504858", "model": "llama", "target_model": "human", "recognition_score": 0.8749346299186241, "ground_truth": 0}, {"key": "22504858", "model": "llama", "target_model": "claude", "recognition_score": 0.888758786580436, "ground_truth": 0}, {"key": "22504858", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8783142442130489, "ground_truth": 0}, {"key": "22504858", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6370307751592968, "ground_truth": 0}, {"key": "32283530", "model": "llama", "target_model": "llama", "recognition_score": 0.856812296235201, "ground_truth": 1}, {"key": "32283530", "model": "llama", "target_model": "human", "recognition_score": 0.8056321704237815, "ground_truth": 0}, {"key": "32283530", "model": "llama", "target_model": "claude", "recognition_score": 0.8459424273527959, "ground_truth": 0}, {"key": "32283530", "model": "llama", "target_model": "gpt4", "recognition_score": 0.852935482317576, "ground_truth": 0}, {"key": "32283530", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8311430364505444, "ground_truth": 0}, {"key": "38377099", "model": "llama", "target_model": "llama", "recognition_score": 0.9053222984231882, "ground_truth": 1}, {"key": "38377099", "model": "llama", "target_model": "human", "recognition_score": 0.8895288505856928, "ground_truth": 0}, {"key": "38377099", "model": "llama", "target_model": "claude", "recognition_score": 0.8732148315005807, "ground_truth": 0}, {"key": "38377099", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9629528326008046, "ground_truth": 0}, {"key": "38377099", "model": "llama", "target_model": "gpt35", "recognition_score": 0.901227419389939, "ground_truth": 0}, {"key": "36105123", "model": "llama", "target_model": "llama", "recognition_score": 0.9416541580704656, "ground_truth": 1}, {"key": "36105123", "model": "llama", "target_model": "human", "recognition_score": 0.9615338086387561, "ground_truth": 0}, {"key": "36105123", "model": "llama", "target_model": "claude", "recognition_score": 0.9777138157321291, "ground_truth": 0}, {"key": "36105123", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9645892726868729, "ground_truth": 0}, {"key": "36105123", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9582261183682348, "ground_truth": 0}, {"key": "33527826", "model": "llama", "target_model": "llama", "recognition_score": 0.8991213713657725, "ground_truth": 1}, {"key": "33527826", "model": "llama", "target_model": "human", "recognition_score": 0.9319595818713103, "ground_truth": 0}, {"key": "33527826", "model": "llama", "target_model": "claude", "recognition_score": 0.8688267910938949, "ground_truth": 0}, {"key": "33527826", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9403530598515116, "ground_truth": 0}, {"key": "33527826", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9572778060889153, "ground_truth": 0}, {"key": "32349891", "model": "llama", "target_model": "llama", "recognition_score": 0.8489721847726983, "ground_truth": 1}, {"key": "32349891", "model": "llama", "target_model": "human", "recognition_score": 0.8679338441689888, "ground_truth": 0}, {"key": "32349891", "model": "llama", "target_model": "claude", "recognition_score": 0.8879840456583324, "ground_truth": 0}, {"key": "32349891", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8652240766661858, "ground_truth": 0}, {"key": "32349891", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8459424352103783, "ground_truth": 0}, {"key": "34281974", "model": "llama", "target_model": "llama", "recognition_score": 0.8152324749631218, "ground_truth": 1}, {"key": "34281974", "model": "llama", "target_model": "human", "recognition_score": 0.6740504797872231, "ground_truth": 0}, {"key": "34281974", "model": "llama", "target_model": "claude", "recognition_score": 0.8116760394449016, "ground_truth": 0}, {"key": "34281974", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6943026707750729, "ground_truth": 0}, {"key": "34281974", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7248702804972942, "ground_truth": 0}, {"key": "29387866", "model": "llama", "target_model": "llama", "recognition_score": 0.5292634144373719, "ground_truth": 1}, {"key": "29387866", "model": "llama", "target_model": "human", "recognition_score": 0.5640984995480038, "ground_truth": 0}, {"key": "29387866", "model": "llama", "target_model": "claude", "recognition_score": 0.6548947286935428, "ground_truth": 0}, {"key": "29387866", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4765796765924075, "ground_truth": 0}, {"key": "29387866", "model": "llama", "target_model": "gpt35", "recognition_score": 0.527316520567378, "ground_truth": 0}, {"key": "35731925", "model": "llama", "target_model": "llama", "recognition_score": 0.9872772905311374, "ground_truth": 1}, {"key": "35731925", "model": "llama", "target_model": "human", "recognition_score": 0.9924227590591087, "ground_truth": 0}, {"key": "35731925", "model": "llama", "target_model": "claude", "recognition_score": 0.9871787856282629, "ground_truth": 0}, {"key": "35731925", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9884026384754805, "ground_truth": 0}, {"key": "35731925", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9875683494730985, "ground_truth": 0}, {"key": "38829733", "model": "llama", "target_model": "llama", "recognition_score": 0.8449215167814532, "ground_truth": 1}, {"key": "38829733", "model": "llama", "target_model": "human", "recognition_score": 0.8962513686277538, "ground_truth": 0}, {"key": "38829733", "model": "llama", "target_model": "claude", "recognition_score": 0.8840392825174195, "ground_truth": 0}, {"key": "38829733", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8925625145415418, "ground_truth": 0}, {"key": "38829733", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9005297862752424, "ground_truth": 0}, {"key": "24624736", "model": "llama", "target_model": "llama", "recognition_score": 0.9161096124811553, "ground_truth": 1}, {"key": "24624736", "model": "llama", "target_model": "human", "recognition_score": 0.9348724534511054, "ground_truth": 0}, {"key": "24624736", "model": "llama", "target_model": "claude", "recognition_score": 0.9376689640904157, "ground_truth": 0}, {"key": "24624736", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8955226797685032, "ground_truth": 0}, {"key": "24624736", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9059898123684821, "ground_truth": 0}, {"key": "36928562", "model": "llama", "target_model": "llama", "recognition_score": 0.9761291625852301, "ground_truth": 1}, {"key": "36928562", "model": "llama", "target_model": "human", "recognition_score": 0.9810219633679125, "ground_truth": 0}, {"key": "36928562", "model": "llama", "target_model": "claude", "recognition_score": 0.9609517032298045, "ground_truth": 0}, {"key": "36928562", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9918120899511637, "ground_truth": 0}, {"key": "36928562", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9822877003208215, "ground_truth": 0}, {"key": "34941119", "model": "llama", "target_model": "llama", "recognition_score": 0.7534666558676251, "ground_truth": 1}, {"key": "34941119", "model": "llama", "target_model": "human", "recognition_score": 0.5058591064886846, "ground_truth": 0}, {"key": "34941119", "model": "llama", "target_model": "claude", "recognition_score": 0.6859494716536716, "ground_truth": 0}, {"key": "34941119", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7356416442315863, "ground_truth": 0}, {"key": "34941119", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7310585783244837, "ground_truth": 0}, {"key": "30206231", "model": "llama", "target_model": "llama", "recognition_score": 0.5583270068690254, "ground_truth": 1}, {"key": "30206231", "model": "llama", "target_model": "human", "recognition_score": 0.6039318202894087, "ground_truth": 0}, {"key": "30206231", "model": "llama", "target_model": "claude", "recognition_score": 0.4282333689237553, "ground_truth": 0}, {"key": "30206231", "model": "llama", "target_model": "gpt4", "recognition_score": 0.679178685126686, "ground_truth": 0}, {"key": "30206231", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5907792160331065, "ground_truth": 0}, {"key": "35584972", "model": "llama", "target_model": "llama", "recognition_score": 0.6495785935161136, "ground_truth": 1}, {"key": "35584972", "model": "llama", "target_model": "human", "recognition_score": 0.8749346197415263, "ground_truth": 0}, {"key": "35584972", "model": "llama", "target_model": "claude", "recognition_score": 0.38861804240395476, "ground_truth": 0}, {"key": "35584972", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5506073909109028, "ground_truth": 0}, {"key": "35584972", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6791787103860452, "ground_truth": 0}, {"key": "39277709", "model": "llama", "target_model": "llama", "recognition_score": 0.9394706096976493, "ground_truth": 1}, {"key": "39277709", "model": "llama", "target_model": "human", "recognition_score": 0.9757623663449605, "ground_truth": 0}, {"key": "39277709", "model": "llama", "target_model": "claude", "recognition_score": 0.9697854145288372, "ground_truth": 0}, {"key": "39277709", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9559813582654021, "ground_truth": 0}, {"key": "39277709", "model": "llama", "target_model": "gpt35", "recognition_score": 0.970013491771385, "ground_truth": 0}, {"key": "36123657", "model": "llama", "target_model": "llama", "recognition_score": 0.9130583509317642, "ground_truth": 1}, {"key": "36123657", "model": "llama", "target_model": "human", "recognition_score": 0.9235923262430163, "ground_truth": 0}, {"key": "36123657", "model": "llama", "target_model": "claude", "recognition_score": 0.9372107915614664, "ground_truth": 0}, {"key": "36123657", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8679338427126743, "ground_truth": 0}, {"key": "36123657", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8344069001765478, "ground_truth": 0}, {"key": "33363938", "model": "llama", "target_model": "llama", "recognition_score": 0.9005297814696915, "ground_truth": 1}, {"key": "33363938", "model": "llama", "target_model": "human", "recognition_score": 0.5794003945552088, "ground_truth": 0}, {"key": "33363938", "model": "llama", "target_model": "claude", "recognition_score": 0.8840392790996487, "ground_truth": 0}, {"key": "33363938", "model": "llama", "target_model": "gpt4", "recognition_score": 0.90397450876853, "ground_truth": 0}, {"key": "33363938", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9728307648045098, "ground_truth": 0}, {"key": "37349129", "model": "llama", "target_model": "llama", "recognition_score": 0.8267118159249368, "ground_truth": 1}, {"key": "37349129", "model": "llama", "target_model": "human", "recognition_score": 0.5117166104127822, "ground_truth": 0}, {"key": "37349129", "model": "llama", "target_model": "claude", "recognition_score": 0.8568122980966865, "ground_truth": 0}, {"key": "37349129", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8587185820630188, "ground_truth": 0}, {"key": "37349129", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7634837968713076, "ground_truth": 0}, {"key": "37160199", "model": "llama", "target_model": "llama", "recognition_score": 0.7476159646528412, "ground_truth": 1}, {"key": "37160199", "model": "llama", "target_model": "human", "recognition_score": 0.5097643649861049, "ground_truth": 0}, {"key": "37160199", "model": "llama", "target_model": "claude", "recognition_score": 0.46684558834117207, "ground_truth": 0}, {"key": "37160199", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5058590953436859, "ground_truth": 0}, {"key": "37160199", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4941408818368025, "ground_truth": 0}, {"key": "35891053", "model": "llama", "target_model": "llama", "recognition_score": 0.9196425302066429, "ground_truth": 1}, {"key": "35891053", "model": "llama", "target_model": "human", "recognition_score": 0.9372107970330666, "ground_truth": 0}, {"key": "35891053", "model": "llama", "target_model": "claude", "recognition_score": 0.8856314652928882, "ground_truth": 0}, {"key": "35891053", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9026096022384287, "ground_truth": 0}, {"key": "35891053", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9230391717789912, "ground_truth": 0}, {"key": "40694542", "model": "llama", "target_model": "llama", "recognition_score": 0.7008947951802331, "ground_truth": 1}, {"key": "40694542", "model": "llama", "target_model": "human", "recognition_score": 0.6688802635189677, "ground_truth": 0}, {"key": "40694542", "model": "llama", "target_model": "claude", "recognition_score": 0.7310585770103353, "ground_truth": 0}, {"key": "40694542", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6584175019470786, "ground_truth": 0}, {"key": "40694542", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5774953357481133, "ground_truth": 0}, {"key": "24645770", "model": "llama", "target_model": "llama", "recognition_score": 0.740174368430911, "ground_truth": 1}, {"key": "24645770", "model": "llama", "target_model": "human", "recognition_score": 0.8267117960245728, "ground_truth": 0}, {"key": "24645770", "model": "llama", "target_model": "claude", "recognition_score": 0.9167080727910986, "ground_truth": 0}, {"key": "24645770", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8984105496655155, "ground_truth": 0}, {"key": "24645770", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8289388224290205, "ground_truth": 0}, {"key": "37974587", "model": "llama", "target_model": "llama", "recognition_score": 0.9588471137532872, "ground_truth": 1}, {"key": "37974587", "model": "llama", "target_model": "human", "recognition_score": 0.94659666697036, "ground_truth": 0}, {"key": "37974587", "model": "llama", "target_model": "claude", "recognition_score": 0.9612438051109329, "ground_truth": 0}, {"key": "37974587", "model": "llama", "target_model": "gpt4", "recognition_score": 0.94499470864311, "ground_truth": 0}, {"key": "37974587", "model": "llama", "target_model": "gpt35", "recognition_score": 0.90665312229001, "ground_truth": 0}, {"key": "40354149", "model": "llama", "target_model": "llama", "recognition_score": 0.8864204025557338, "ground_truth": 1}, {"key": "40354149", "model": "llama", "target_model": "human", "recognition_score": 0.7008947838148485, "ground_truth": 0}, {"key": "40354149", "model": "llama", "target_model": "claude", "recognition_score": 0.8479677623710811, "ground_truth": 0}, {"key": "40354149", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8376199584429617, "ground_truth": 0}, {"key": "40354149", "model": "llama", "target_model": "gpt35", "recognition_score": 0.856812310590377, "ground_truth": 0}, {"key": "35519470", "model": "llama", "target_model": "llama", "recognition_score": 0.5409238649390956, "ground_truth": 1}, {"key": "35519470", "model": "llama", "target_model": "human", "recognition_score": 0.5428632861085625, "ground_truth": 0}, {"key": "35519470", "model": "llama", "target_model": "claude", "recognition_score": 0.4301473581948581, "ground_truth": 0}, {"key": "35519470", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3849121536686458, "ground_truth": 0}, {"key": "35519470", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5273165278242156, "ground_truth": 0}, {"key": "36185624", "model": "llama", "target_model": "llama", "recognition_score": 0.9012274199140207, "ground_truth": 1}, {"key": "36185624", "model": "llama", "target_model": "human", "recognition_score": 0.8902942184198609, "ground_truth": 0}, {"key": "36185624", "model": "llama", "target_model": "claude", "recognition_score": 0.9686195703917483, "ground_truth": 0}, {"key": "36185624", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9149009415718704, "ground_truth": 0}, {"key": "36185624", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9039745141701729, "ground_truth": 0}, {"key": "39306113", "model": "llama", "target_model": "llama", "recognition_score": 0.540923859206797, "ground_truth": 1}, {"key": "39306113", "model": "llama", "target_model": "human", "recognition_score": 0.4571366994271236, "ground_truth": 0}, {"key": "39306113", "model": "llama", "target_model": "claude", "recognition_score": 0.4824291114249643, "ground_truth": 0}, {"key": "39306113", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5253688158182793, "ground_truth": 0}, {"key": "39306113", "model": "llama", "target_model": "gpt35", "recognition_score": 0.23510838958802474, "ground_truth": 0}, {"key": "19347718", "model": "llama", "target_model": "llama", "recognition_score": 0.7905303320103124, "ground_truth": 1}, {"key": "19347718", "model": "llama", "target_model": "human", "recognition_score": 0.7592254060821914, "ground_truth": 0}, {"key": "19347718", "model": "llama", "target_model": "claude", "recognition_score": 0.8344068903748041, "ground_truth": 0}, {"key": "19347718", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7799929110937568, "ground_truth": 0}, {"key": "19347718", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8198933318137067, "ground_truth": 0}, {"key": "21870064", "model": "llama", "target_model": "llama", "recognition_score": 0.7138307446909881, "ground_truth": 1}, {"key": "21870064", "model": "llama", "target_model": "human", "recognition_score": 0.5292633751500034, "ground_truth": 0}, {"key": "21870064", "model": "llama", "target_model": "claude", "recognition_score": 0.6001883653919765, "ground_truth": 0}, {"key": "21870064", "model": "llama", "target_model": "gpt4", "recognition_score": 0.613236553897909, "ground_truth": 0}, {"key": "21870064", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7090191122376883, "ground_truth": 0}, {"key": "37675776", "model": "llama", "target_model": "llama", "recognition_score": 0.9648551491325206, "ground_truth": 1}, {"key": "37675776", "model": "llama", "target_model": "human", "recognition_score": 0.9591542830117885, "ground_truth": 0}, {"key": "37675776", "model": "llama", "target_model": "claude", "recognition_score": 0.9324533105835744, "ground_truth": 0}, {"key": "37675776", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9294404094847386, "ground_truth": 0}, {"key": "37675776", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9603611602738686, "ground_truth": 0}, {"key": "38107017", "model": "llama", "target_model": "llama", "recognition_score": 0.7981867772150923, "ground_truth": 1}, {"key": "38107017", "model": "llama", "target_model": "human", "recognition_score": 0.7931059493247246, "ground_truth": 0}, {"key": "38107017", "model": "llama", "target_model": "claude", "recognition_score": 0.7325918548485711, "ground_truth": 0}, {"key": "38107017", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7310585769825901, "ground_truth": 0}, {"key": "38107017", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7943849475768313, "ground_truth": 0}, {"key": "40046472", "model": "llama", "target_model": "llama", "recognition_score": 0.2893717023450211, "ground_truth": 1}, {"key": "40046472", "model": "llama", "target_model": "human", "recognition_score": 0.8354835416157415, "ground_truth": 0}, {"key": "40046472", "model": "llama", "target_model": "claude", "recognition_score": 0.803173794250912, "ground_truth": 0}, {"key": "40046472", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6723317093455631, "ground_truth": 0}, {"key": "40046472", "model": "llama", "target_model": "gpt35", "recognition_score": 0.49804687608464465, "ground_truth": 0}, {"key": "32157820", "model": "llama", "target_model": "llama", "recognition_score": 0.7648916079744184, "ground_truth": 1}, {"key": "32157820", "model": "llama", "target_model": "human", "recognition_score": 0.8624675441978503, "ground_truth": 0}, {"key": "32157820", "model": "llama", "target_model": "claude", "recognition_score": 0.6976089187803695, "ground_truth": 0}, {"key": "32157820", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6992544151812391, "ground_truth": 0}, {"key": "32157820", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8661325180286887, "ground_truth": 0}, {"key": "41004037", "model": "llama", "target_model": "llama", "recognition_score": 0.8840392773732797, "ground_truth": 1}, {"key": "41004037", "model": "llama", "target_model": "human", "recognition_score": 0.7341195217164777, "ground_truth": 0}, {"key": "41004037", "model": "llama", "target_model": "claude", "recognition_score": 0.6654105469021874, "ground_truth": 0}, {"key": "41004037", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7931059490745842, "ground_truth": 0}, {"key": "41004037", "model": "llama", "target_model": "gpt35", "recognition_score": 0.850964689923496, "ground_truth": 0}, {"key": "21387993", "model": "llama", "target_model": "llama", "recognition_score": 0.7154240081418047, "ground_truth": 1}, {"key": "21387993", "model": "llama", "target_model": "human", "recognition_score": 0.7676898447441025, "ground_truth": 0}, {"key": "21387993", "model": "llama", "target_model": "claude", "recognition_score": 0.6206216098446855, "ground_truth": 0}, {"key": "21387993", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7813306138503822, "ground_truth": 0}, {"key": "21387993", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8661325115562404, "ground_truth": 0}, {"key": "34665539", "model": "llama", "target_model": "llama", "recognition_score": 0.6876300031741588, "ground_truth": 1}, {"key": "34665539", "model": "llama", "target_model": "human", "recognition_score": 0.6169358214306473, "ground_truth": 0}, {"key": "34665539", "model": "llama", "target_model": "claude", "recognition_score": 0.7122322113224284, "ground_truth": 0}, {"key": "34665539", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7248702932123146, "ground_truth": 0}, {"key": "34665539", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7931059509562322, "ground_truth": 0}, {"key": "37872111", "model": "llama", "target_model": "llama", "recognition_score": 0.46295860235789466, "ground_truth": 1}, {"key": "37872111", "model": "llama", "target_model": "human", "recognition_score": 0.8670357501374872, "ground_truth": 0}, {"key": "37872111", "model": "llama", "target_model": "claude", "recognition_score": 0.9066531200529537, "ground_truth": 0}, {"key": "37872111", "model": "llama", "target_model": "gpt4", "recognition_score": 0.44167301707539336, "ground_truth": 0}, {"key": "37872111", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7994423126168276, "ground_truth": 0}, {"key": "36629542", "model": "llama", "target_model": "llama", "recognition_score": 0.8984105549278585, "ground_truth": 1}, {"key": "36629542", "model": "llama", "target_model": "human", "recognition_score": 0.8068526346612276, "ground_truth": 0}, {"key": "36629542", "model": "llama", "target_model": "claude", "recognition_score": 0.8947894616560871, "ground_truth": 0}, {"key": "36629542", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7248702868373441, "ground_truth": 0}, {"key": "36629542", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8757870003364524, "ground_truth": 0}, {"key": "36487527", "model": "llama", "target_model": "llama", "recognition_score": 0.9111797071859532, "ground_truth": 1}, {"key": "36487527", "model": "llama", "target_model": "human", "recognition_score": 0.594551261639773, "ground_truth": 0}, {"key": "36487527", "model": "llama", "target_model": "claude", "recognition_score": 0.838679771254597, "ground_truth": 0}, {"key": "36487527", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8940517199234581, "ground_truth": 0}, {"key": "36487527", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8910549593520352, "ground_truth": 0}, {"key": "37344756", "model": "llama", "target_model": "llama", "recognition_score": 0.9441768611475106, "ground_truth": 1}, {"key": "37344756", "model": "llama", "target_model": "human", "recognition_score": 0.8596637443884247, "ground_truth": 0}, {"key": "37344756", "model": "llama", "target_model": "claude", "recognition_score": 0.9294404071737119, "ground_truth": 0}, {"key": "37344756", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8568122966984684, "ground_truth": 0}, {"key": "37344756", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9142907283290499, "ground_truth": 0}, {"key": "38707722", "model": "llama", "target_model": "llama", "recognition_score": 0.5273165398246503, "ground_truth": 1}, {"key": "38707722", "model": "llama", "target_model": "human", "recognition_score": 0.5195213592548374, "ground_truth": 0}, {"key": "38707722", "model": "llama", "target_model": "claude", "recognition_score": 0.5717666118153187, "ground_truth": 0}, {"key": "38707722", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7295197917583774, "ground_truth": 0}, {"key": "38707722", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7310585709766606, "ground_truth": 0}, {"key": "37093419", "model": "llama", "target_model": "llama", "recognition_score": 0.3647775856610224, "ground_truth": 1}, {"key": "37093419", "model": "llama", "target_model": "human", "recognition_score": 0.09877258903289488, "ground_truth": 0}, {"key": "37093419", "model": "llama", "target_model": "claude", "recognition_score": 0.3684056866427929, "ground_truth": 0}, {"key": "37093419", "model": "llama", "target_model": "gpt4", "recognition_score": 0.2107662966739342, "ground_truth": 0}, {"key": "37093419", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4054487220633993, "ground_truth": 0}, {"key": "35547391", "model": "llama", "target_model": "llama", "recognition_score": 0.7826624781781204, "ground_truth": 1}, {"key": "35547391", "model": "llama", "target_model": "human", "recognition_score": 0.7534666785727122, "ground_truth": 0}, {"key": "35547391", "model": "llama", "target_model": "claude", "recognition_score": 0.7341195541889812, "ground_truth": 0}, {"key": "35547391", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7310585683145955, "ground_truth": 0}, {"key": "35547391", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8459424476682647, "ground_truth": 0}, {"key": "37173168", "model": "llama", "target_model": "llama", "recognition_score": 0.8509646988134038, "ground_truth": 1}, {"key": "37173168", "model": "llama", "target_model": "human", "recognition_score": 0.8198933418432558, "ground_truth": 0}, {"key": "37173168", "model": "llama", "target_model": "claude", "recognition_score": 0.8661325185094025, "ground_truth": 0}, {"key": "37173168", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7634837619648458, "ground_truth": 0}, {"key": "37173168", "model": "llama", "target_model": "gpt35", "recognition_score": 0.769080235099127, "ground_truth": 0}, {"key": "30725298", "model": "llama", "target_model": "llama", "recognition_score": 0.8774767890691628, "ground_truth": 1}, {"key": "30725298", "model": "llama", "target_model": "human", "recognition_score": 0.8289388026874548, "ground_truth": 0}, {"key": "30725298", "model": "llama", "target_model": "claude", "recognition_score": 0.828938811953253, "ground_truth": 0}, {"key": "30725298", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8848377693305528, "ground_truth": 0}, {"key": "30725298", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8116760233373637, "ground_truth": 0}, {"key": "33830573", "model": "llama", "target_model": "llama", "recognition_score": 0.9367494743790415, "ground_truth": 1}, {"key": "33830573", "model": "llama", "target_model": "human", "recognition_score": 0.873214828933228, "ground_truth": 0}, {"key": "33830573", "model": "llama", "target_model": "claude", "recognition_score": 0.8221891182211172, "ground_truth": 0}, {"key": "33830573", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9489172610239889, "ground_truth": 0}, {"key": "33830573", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7648916175499604, "ground_truth": 0}, {"key": "33415474", "model": "llama", "target_model": "llama", "recognition_score": 0.16026602489841646, "ground_truth": 1}, {"key": "33415474", "model": "llama", "target_model": "human", "recognition_score": 0.2393493516666555, "ground_truth": 0}, {"key": "33415474", "model": "llama", "target_model": "claude", "recognition_score": 0.18126320138351656, "ground_truth": 0}, {"key": "33415474", "model": "llama", "target_model": "gpt4", "recognition_score": 0.19559407075846957, "ground_truth": 0}, {"key": "33415474", "model": "llama", "target_model": "gpt35", "recognition_score": 0.1645164551620461, "ground_truth": 0}, {"key": "37383994", "model": "llama", "target_model": "llama", "recognition_score": 0.9529258207136571, "ground_truth": 1}, {"key": "37383994", "model": "llama", "target_model": "human", "recognition_score": 0.980129287586846, "ground_truth": 0}, {"key": "37383994", "model": "llama", "target_model": "claude", "recognition_score": 0.96641049036005, "ground_truth": 0}, {"key": "37383994", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9715639654212006, "ground_truth": 0}, {"key": "37383994", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9717790155539999, "ground_truth": 0}, {"key": "38576819", "model": "llama", "target_model": "llama", "recognition_score": 0.5679365975525221, "ground_truth": 1}, {"key": "38576819", "model": "llama", "target_model": "human", "recognition_score": 0.7295197953833431, "ground_truth": 0}, {"key": "38576819", "model": "llama", "target_model": "claude", "recognition_score": 0.6442250770876609, "ground_truth": 0}, {"key": "38576819", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7122322036793858, "ground_truth": 0}, {"key": "38576819", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6076631543987672, "ground_truth": 0}, {"key": "34500226", "model": "llama", "target_model": "llama", "recognition_score": 0.6825737249386293, "ground_truth": 1}, {"key": "34500226", "model": "llama", "target_model": "human", "recognition_score": 0.7325918512965272, "ground_truth": 0}, {"key": "34500226", "model": "llama", "target_model": "claude", "recognition_score": 0.7549150041946461, "ground_truth": 0}, {"key": "34500226", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7969253792602705, "ground_truth": 0}, {"key": "34500226", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7648916199871864, "ground_truth": 0}, {"key": "39856394", "model": "llama", "target_model": "llama", "recognition_score": 0.8652240824621162, "ground_truth": 1}, {"key": "39856394", "model": "llama", "target_model": "human", "recognition_score": 0.7772998690133416, "ground_truth": 0}, {"key": "39856394", "model": "llama", "target_model": "claude", "recognition_score": 0.8519528132505406, "ground_truth": 0}, {"key": "39856394", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8128673304763023, "ground_truth": 0}, {"key": "39856394", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7813306201415622, "ground_truth": 0}, {"key": "35499522", "model": "llama", "target_model": "llama", "recognition_score": 0.24653334893642576, "ground_truth": 1}, {"key": "35499522", "model": "llama", "target_model": "human", "recognition_score": 0.3629692099989223, "ground_truth": 0}, {"key": "35499522", "model": "llama", "target_model": "claude", "recognition_score": 0.17328821471002126, "ground_truth": 0}, {"key": "35499522", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4455295106246985, "ground_truth": 0}, {"key": "35499522", "model": "llama", "target_model": "gpt35", "recognition_score": 0.15507846483372342, "ground_truth": 0}, {"key": "30157766", "model": "llama", "target_model": "llama", "recognition_score": 0.8955226712211973, "ground_truth": 1}, {"key": "30157766", "model": "llama", "target_model": "human", "recognition_score": 0.9329437085307445, "ground_truth": 0}, {"key": "30157766", "model": "llama", "target_model": "claude", "recognition_score": 0.8962513677129196, "ground_truth": 0}, {"key": "30157766", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9167080798841816, "ground_truth": 0}, {"key": "30157766", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9559813552733031, "ground_truth": 0}, {"key": "40472346", "model": "llama", "target_model": "llama", "recognition_score": 0.9329437060164136, "ground_truth": 1}, {"key": "40472346", "model": "llama", "target_model": "human", "recognition_score": 0.8499711711345165, "ground_truth": 0}, {"key": "40472346", "model": "llama", "target_model": "claude", "recognition_score": 0.8832359853258506, "ground_truth": 0}, {"key": "40472346", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9399133446264875, "ground_truth": 0}, {"key": "40472346", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9178933796599051, "ground_truth": 0}, {"key": "35305635", "model": "llama", "target_model": "llama", "recognition_score": 0.964589269676505, "ground_truth": 1}, {"key": "35305635", "model": "llama", "target_model": "human", "recognition_score": 0.9343951644318339, "ground_truth": 0}, {"key": "35305635", "model": "llama", "target_model": "claude", "recognition_score": 0.94208191487966, "ground_truth": 0}, {"key": "35305635", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9690910423438726, "ground_truth": 0}, {"key": "35305635", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9334308168473096, "ground_truth": 0}, {"key": "32495926", "model": "llama", "target_model": "llama", "recognition_score": 0.9039745149325218, "ground_truth": 1}, {"key": "32495926", "model": "llama", "target_model": "human", "recognition_score": 0.7981867816342401, "ground_truth": 0}, {"key": "32495926", "model": "llama", "target_model": "claude", "recognition_score": 0.9026096050490097, "ground_truth": 0}, {"key": "32495926", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7931059328420371, "ground_truth": 0}, {"key": "32495926", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8624675239674472, "ground_truth": 0}, {"key": "37353801", "model": "llama", "target_model": "llama", "recognition_score": 0.4629586253670161, "ground_truth": 1}, {"key": "37353801", "model": "llama", "target_model": "human", "recognition_score": 0.44746030828928124, "ground_truth": 0}, {"key": "37353801", "model": "llama", "target_model": "claude", "recognition_score": 0.6206216120705825, "ground_truth": 0}, {"key": "37353801", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6959583313292121, "ground_truth": 0}, {"key": "37353801", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6095241818007462, "ground_truth": 0}, {"key": "30159904", "model": "llama", "target_model": "llama", "recognition_score": 0.8879840440553195, "ground_truth": 1}, {"key": "30159904", "model": "llama", "target_model": "human", "recognition_score": 0.6636689490538867, "ground_truth": 0}, {"key": "30159904", "model": "llama", "target_model": "claude", "recognition_score": 0.7956581032570593, "ground_truth": 0}, {"key": "30159904", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8499711689174893, "ground_truth": 0}, {"key": "30159904", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8633916120207193, "ground_truth": 0}, {"key": "33698679", "model": "llama", "target_model": "llama", "recognition_score": 0.8397339648898884, "ground_truth": 1}, {"key": "33698679", "model": "llama", "target_model": "human", "recognition_score": 0.8333245834982789, "ground_truth": 0}, {"key": "33698679", "model": "llama", "target_model": "claude", "recognition_score": 0.7520125855665053, "ground_truth": 0}, {"key": "33698679", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6876299957440435, "ground_truth": 0}, {"key": "33698679", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9118099531711923, "ground_truth": 0}, {"key": "40530172", "model": "llama", "target_model": "llama", "recognition_score": 0.9715639649353307, "ground_truth": 1}, {"key": "40530172", "model": "llama", "target_model": "human", "recognition_score": 0.7592254262653864, "ground_truth": 0}, {"key": "40530172", "model": "llama", "target_model": "claude", "recognition_score": 0.8044059104286706, "ground_truth": 0}, {"key": "40530172", "model": "llama", "target_model": "gpt4", "recognition_score": 0.777299873669604, "ground_truth": 0}, {"key": "40530172", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7356416311463944, "ground_truth": 0}, {"key": "40652941", "model": "llama", "target_model": "llama", "recognition_score": 0.9575961732733559, "ground_truth": 1}, {"key": "40652941", "model": "llama", "target_model": "human", "recognition_score": 0.7866228283037817, "ground_truth": 0}, {"key": "40652941", "model": "llama", "target_model": "claude", "recognition_score": 0.9618217263113761, "ground_truth": 0}, {"key": "40652941", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9012274034555813, "ground_truth": 0}, {"key": "40652941", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8991213764265524, "ground_truth": 0}, {"key": "40122246", "model": "llama", "target_model": "llama", "recognition_score": 0.31405057148819054, "ground_truth": 1}, {"key": "40122246", "model": "llama", "target_model": "human", "recognition_score": 0.20181322425872142, "ground_truth": 0}, {"key": "40122246", "model": "llama", "target_model": "claude", "recognition_score": 0.26133092903505684, "ground_truth": 0}, {"key": "40122246", "model": "llama", "target_model": "gpt4", "recognition_score": 0.20181322288174172, "ground_truth": 0}, {"key": "40122246", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4263215911915483, "ground_truth": 0}, {"key": "40032656", "model": "llama", "target_model": "llama", "recognition_score": 0.898410549664322, "ground_truth": 1}, {"key": "40032656", "model": "llama", "target_model": "human", "recognition_score": 0.8633916196083242, "ground_truth": 0}, {"key": "40032656", "model": "llama", "target_model": "claude", "recognition_score": 0.9235923101137608, "ground_truth": 0}, {"key": "40032656", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8879840520436065, "ground_truth": 0}, {"key": "40032656", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8872046036310489, "ground_truth": 0}, {"key": "38913680", "model": "llama", "target_model": "llama", "recognition_score": 0.7356416473748982, "ground_truth": 1}, {"key": "38913680", "model": "llama", "target_model": "human", "recognition_score": 0.5448013968263189, "ground_truth": 0}, {"key": "38913680", "model": "llama", "target_model": "claude", "recognition_score": 0.5983122088106234, "ground_truth": 0}, {"key": "38913680", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6187804688785581, "ground_truth": 0}, {"key": "38913680", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8278281536900518, "ground_truth": 0}, {"key": "17608039", "model": "llama", "target_model": "llama", "recognition_score": 0.6095241513384179, "ground_truth": 1}, {"key": "17608039", "model": "llama", "target_model": "human", "recognition_score": 0.5175708943331542, "ground_truth": 0}, {"key": "17608039", "model": "llama", "target_model": "claude", "recognition_score": 0.4863315181948201, "ground_truth": 0}, {"key": "17608039", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4282334016412985, "ground_truth": 0}, {"key": "17608039", "model": "llama", "target_model": "gpt35", "recognition_score": 0.40356683164009394, "ground_truth": 0}, {"key": "40434901", "model": "llama", "target_model": "llama", "recognition_score": 0.9618217261726201, "ground_truth": 1}, {"key": "40434901", "model": "llama", "target_model": "human", "recognition_score": 0.9005297879816717, "ground_truth": 0}, {"key": "40434901", "model": "llama", "target_model": "claude", "recognition_score": 0.9111797091180373, "ground_truth": 0}, {"key": "40434901", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9686195695139602, "ground_truth": 0}, {"key": "40434901", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9594592609814332, "ground_truth": 0}, {"key": "37680058", "model": "llama", "target_model": "llama", "recognition_score": 0.34864514208779335, "ground_truth": 1}, {"key": "37680058", "model": "llama", "target_model": "human", "recognition_score": 0.3174262375878858, "ground_truth": 0}, {"key": "37680058", "model": "llama", "target_model": "claude", "recognition_score": 0.2509127652189853, "ground_truth": 0}, {"key": "37680058", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "37680058", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6020616170581528, "ground_truth": 0}, {"key": "37291821", "model": "llama", "target_model": "llama", "recognition_score": 0.8615382178159907, "ground_truth": 1}, {"key": "37291821", "model": "llama", "target_model": "human", "recognition_score": 0.8652240873508544, "ground_truth": 0}, {"key": "37291821", "model": "llama", "target_model": "claude", "recognition_score": 0.7853085847011835, "ground_truth": 0}, {"key": "37291821", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8255897109540087, "ground_truth": 0}, {"key": "37291821", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9046505357034352, "ground_truth": 0}, {"key": "41002743", "model": "llama", "target_model": "llama", "recognition_score": 0.7401743554414807, "ground_truth": 1}, {"key": "41002743", "model": "llama", "target_model": "human", "recognition_score": 0.718594374456273, "ground_truth": 0}, {"key": "41002743", "model": "llama", "target_model": "claude", "recognition_score": 0.7690802316592585, "ground_truth": 0}, {"key": "41002743", "model": "llama", "target_model": "gpt4", "recognition_score": 0.837619962326371, "ground_truth": 0}, {"key": "41002743", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8539127347079646, "ground_truth": 0}, {"key": "36322869", "model": "llama", "target_model": "llama", "recognition_score": 0.8947894537778844, "ground_truth": 1}, {"key": "36322869", "model": "llama", "target_model": "human", "recognition_score": 0.9213576157565685, "ground_truth": 0}, {"key": "36322869", "model": "llama", "target_model": "claude", "recognition_score": 0.944176859795454, "ground_truth": 0}, {"key": "36322869", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9019206731818448, "ground_truth": 0}, {"key": "36322869", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6876299862570664, "ground_truth": 0}, {"key": "39459717", "model": "llama", "target_model": "llama", "recognition_score": 0.8198933275519107, "ground_truth": 1}, {"key": "39459717", "model": "llama", "target_model": "human", "recognition_score": 0.8333245826720268, "ground_truth": 0}, {"key": "39459717", "model": "llama", "target_model": "claude", "recognition_score": 0.9053222982229648, "ground_truth": 0}, {"key": "39459717", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8615382145112311, "ground_truth": 0}, {"key": "39459717", "model": "llama", "target_model": "gpt35", "recognition_score": 0.867035756681898, "ground_truth": 0}, {"key": "36503727", "model": "llama", "target_model": "llama", "recognition_score": 0.7534666552055675, "ground_truth": 1}, {"key": "36503727", "model": "llama", "target_model": "human", "recognition_score": 0.6113819859568183, "ground_truth": 0}, {"key": "36503727", "model": "llama", "target_model": "claude", "recognition_score": 0.6531269160061965, "ground_truth": 0}, {"key": "36503727", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8278281464234328, "ground_truth": 0}, {"key": "36503727", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8479677555736558, "ground_truth": 0}, {"key": "35682367", "model": "llama", "target_model": "llama", "recognition_score": 0.9429285975677563, "ground_truth": 1}, {"key": "35682367", "model": "llama", "target_model": "human", "recognition_score": 0.9787126484677615, "ground_truth": 0}, {"key": "35682367", "model": "llama", "target_model": "claude", "recognition_score": 0.8723473877050465, "ground_truth": 0}, {"key": "35682367", "model": "llama", "target_model": "gpt4", "recognition_score": 0.942081914114947, "ground_truth": 0}, {"key": "35682367", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8152324764152208, "ground_truth": 0}, {"key": "36472353", "model": "llama", "target_model": "llama", "recognition_score": 0.727975463919293, "ground_truth": 1}, {"key": "36472353", "model": "llama", "target_model": "human", "recognition_score": 0.7620701025286123, "ground_truth": 0}, {"key": "36472353", "model": "llama", "target_model": "claude", "recognition_score": 0.7341195475398733, "ground_truth": 0}, {"key": "36472353", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6808786166701983, "ground_truth": 0}, {"key": "36472353", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5869964321520607, "ground_truth": 0}, {"key": "37651907", "model": "llama", "target_model": "llama", "recognition_score": 0.8221891433986256, "ground_truth": 1}, {"key": "37651907", "model": "llama", "target_model": "human", "recognition_score": 0.7745833730530912, "ground_truth": 0}, {"key": "37651907", "model": "llama", "target_model": "claude", "recognition_score": 0.6774740174190267, "ground_truth": 0}, {"key": "37651907", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7446563472109553, "ground_truth": 0}, {"key": "37651907", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6688802864546504, "ground_truth": 0}, {"key": "36255476", "model": "llama", "target_model": "llama", "recognition_score": 0.8407825907766929, "ground_truth": 1}, {"key": "36255476", "model": "llama", "target_model": "human", "recognition_score": 0.7577943828123079, "ground_truth": 0}, {"key": "36255476", "model": "llama", "target_model": "claude", "recognition_score": 0.8816149182437436, "ground_truth": 0}, {"key": "36255476", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8848377688339282, "ground_truth": 0}, {"key": "36255476", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7490872103212329, "ground_truth": 0}, {"key": "37283518", "model": "llama", "target_model": "llama", "recognition_score": 0.8962513677031898, "ground_truth": 1}, {"key": "37283518", "model": "llama", "target_model": "human", "recognition_score": 0.8807970826873203, "ground_truth": 0}, {"key": "37283518", "model": "llama", "target_model": "claude", "recognition_score": 0.86613252593043, "ground_truth": 0}, {"key": "37283518", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9099069965354127, "ground_truth": 0}, {"key": "37283518", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8807970727193206, "ground_truth": 0}, {"key": "34906785", "model": "llama", "target_model": "llama", "recognition_score": 0.823328408369672, "ground_truth": 1}, {"key": "34906785", "model": "llama", "target_model": "human", "recognition_score": 0.8539127471818384, "ground_truth": 0}, {"key": "34906785", "model": "llama", "target_model": "claude", "recognition_score": 0.7520125622300717, "ground_truth": 0}, {"key": "34906785", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7279754537413995, "ground_truth": 0}, {"key": "34906785", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7648915942608165, "ground_truth": 0}, {"key": "34965328", "model": "llama", "target_model": "llama", "recognition_score": 0.874077238372357, "ground_truth": 1}, {"key": "34965328", "model": "llama", "target_model": "human", "recognition_score": 0.9257686274312171, "ground_truth": 0}, {"key": "34965328", "model": "llama", "target_model": "claude", "recognition_score": 0.9184802374388142, "ground_truth": 0}, {"key": "34965328", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8705972598826146, "ground_truth": 0}, {"key": "34965328", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8879840447724215, "ground_truth": 0}, {"key": "38788440", "model": "llama", "target_model": "llama", "recognition_score": 0.685949452830674, "ground_truth": 1}, {"key": "38788440", "model": "llama", "target_model": "human", "recognition_score": 0.6132365412099579, "ground_truth": 0}, {"key": "38788440", "model": "llama", "target_model": "claude", "recognition_score": 0.509764402797104, "ground_truth": 0}, {"key": "38788440", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5621764924094158, "ground_truth": 0}, {"key": "38788440", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6206216093883964, "ground_truth": 0}, {"key": "35046866", "model": "llama", "target_model": "llama", "recognition_score": 0.9230391706002671, "ground_truth": 1}, {"key": "35046866", "model": "llama", "target_model": "human", "recognition_score": 0.9202179914184054, "ground_truth": 0}, {"key": "35046866", "model": "llama", "target_model": "claude", "recognition_score": 0.9202179891102782, "ground_truth": 0}, {"key": "35046866", "model": "llama", "target_model": "gpt4", "recognition_score": 0.926835271437021, "ground_truth": 0}, {"key": "35046866", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9066531268417609, "ground_truth": 0}, {"key": "37629558", "model": "llama", "target_model": "llama", "recognition_score": 0.7401743569428262, "ground_truth": 1}, {"key": "37629558", "model": "llama", "target_model": "human", "recognition_score": 0.875786996460639, "ground_truth": 0}, {"key": "37629558", "model": "llama", "target_model": "claude", "recognition_score": 0.6460137046558431, "ground_truth": 0}, {"key": "37629558", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7772998678866484, "ground_truth": 0}, {"key": "37629558", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6992544192768979, "ground_truth": 0}, {"key": "33859914", "model": "llama", "target_model": "llama", "recognition_score": 0.7745833620858036, "ground_truth": 1}, {"key": "33859914", "model": "llama", "target_model": "human", "recognition_score": 0.8152324837960968, "ground_truth": 0}, {"key": "33859914", "model": "llama", "target_model": "claude", "recognition_score": 0.903974507713223, "ground_truth": 0}, {"key": "33859914", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8670357581603446, "ground_truth": 0}, {"key": "33859914", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8438950937907097, "ground_truth": 0}, {"key": "39790523", "model": "llama", "target_model": "llama", "recognition_score": 0.9367494819377153, "ground_truth": 1}, {"key": "39790523", "model": "llama", "target_model": "human", "recognition_score": 0.9039744989791032, "ground_truth": 0}, {"key": "39790523", "model": "llama", "target_model": "claude", "recognition_score": 0.888758790495325, "ground_truth": 0}, {"key": "39790523", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9268352743249157, "ground_truth": 0}, {"key": "39790523", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9149009509849333, "ground_truth": 0}, {"key": "33509656", "model": "llama", "target_model": "llama", "recognition_score": 0.6943026837286342, "ground_truth": 1}, {"key": "33509656", "model": "llama", "target_model": "human", "recognition_score": 0.661922900127787, "ground_truth": 0}, {"key": "33509656", "model": "llama", "target_model": "claude", "recognition_score": 0.3140505370855669, "ground_truth": 0}, {"key": "33509656", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7431680049662038, "ground_truth": 0}, {"key": "33509656", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5602526494449985, "ground_truth": 0}, {"key": "17380923", "model": "llama", "target_model": "llama", "recognition_score": 0.8705972739581349, "ground_truth": 1}, {"key": "17380923", "model": "llama", "target_model": "human", "recognition_score": 0.844921523309009, "ground_truth": 0}, {"key": "17380923", "model": "llama", "target_model": "claude", "recognition_score": 0.9284087974476314, "ground_truth": 0}, {"key": "17380923", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9635062354577565, "ground_truth": 0}, {"key": "17380923", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8354835221056186, "ground_truth": 0}, {"key": "36202526", "model": "llama", "target_model": "llama", "recognition_score": 0.6132365564308787, "ground_truth": 1}, {"key": "36202526", "model": "llama", "target_model": "human", "recognition_score": 0.7662936364797325, "ground_truth": 0}, {"key": "36202526", "model": "llama", "target_model": "claude", "recognition_score": 0.7201715036224475, "ground_truth": 0}, {"key": "36202526", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8449215308350257, "ground_truth": 0}, {"key": "36202526", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8365545669156846, "ground_truth": 0}, {"key": "26419232", "model": "llama", "target_model": "llama", "recognition_score": 0.6297745780931803, "ground_truth": 1}, {"key": "26419232", "model": "llama", "target_model": "human", "recognition_score": 0.8397339763427442, "ground_truth": 0}, {"key": "26419232", "model": "llama", "target_model": "claude", "recognition_score": 0.8289388103838831, "ground_truth": 0}, {"key": "26419232", "model": "llama", "target_model": "gpt4", "recognition_score": 0.713830748409236, "ground_truth": 0}, {"key": "26419232", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7879311897880062, "ground_truth": 0}, {"key": "34232398", "model": "llama", "target_model": "llama", "recognition_score": 0.7931059582095639, "ground_truth": 1}, {"key": "34232398", "model": "llama", "target_model": "human", "recognition_score": 0.8947894587938243, "ground_truth": 0}, {"key": "34232398", "model": "llama", "target_model": "claude", "recognition_score": 0.8267117945313399, "ground_truth": 0}, {"key": "34232398", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8428631374209065, "ground_truth": 0}, {"key": "34232398", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7325918477109983, "ground_truth": 0}, {"key": "33586045", "model": "llama", "target_model": "llama", "recognition_score": 0.9105453973670379, "ground_truth": 1}, {"key": "33586045", "model": "llama", "target_model": "human", "recognition_score": 0.8902942257333321, "ground_truth": 0}, {"key": "33586045", "model": "llama", "target_model": "claude", "recognition_score": 0.8766343818613735, "ground_truth": 0}, {"key": "33586045", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8824278673303727, "ground_truth": 0}, {"key": "33586045", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9130583340185717, "ground_truth": 0}, {"key": "32281151", "model": "llama", "target_model": "llama", "recognition_score": 0.7185944127277422, "ground_truth": 1}, {"key": "32281151", "model": "llama", "target_model": "human", "recognition_score": 0.6206216336258673, "ground_truth": 0}, {"key": "32281151", "model": "llama", "target_model": "claude", "recognition_score": 0.48242909464865996, "ground_truth": 0}, {"key": "32281151", "model": "llama", "target_model": "gpt4", "recognition_score": 0.51952131240107, "ground_truth": 0}, {"key": "32281151", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6370307805353554, "ground_truth": 0}, {"key": "37308159", "model": "llama", "target_model": "llama", "recognition_score": 0.8955226788679462, "ground_truth": 1}, {"key": "37308159", "model": "llama", "target_model": "human", "recognition_score": 0.9651191127386631, "ground_truth": 0}, {"key": "37308159", "model": "llama", "target_model": "claude", "recognition_score": 0.9362850062055995, "ground_truth": 0}, {"key": "37308159", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9648551525174504, "ground_truth": 0}, {"key": "37308159", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9453993968387729, "ground_truth": 0}, {"key": "35694408", "model": "llama", "target_model": "llama", "recognition_score": 0.8757869834463394, "ground_truth": 1}, {"key": "35694408", "model": "llama", "target_model": "human", "recognition_score": 0.9788748056155127, "ground_truth": 0}, {"key": "35694408", "model": "llama", "target_model": "claude", "recognition_score": 0.9207896722369223, "ground_truth": 0}, {"key": "35694408", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8791467835511865, "ground_truth": 0}, {"key": "35694408", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8902942226457939, "ground_truth": 0}, {"key": "39781995", "model": "llama", "target_model": "llama", "recognition_score": 0.4397473367837077, "ground_truth": 1}, {"key": "39781995", "model": "llama", "target_model": "human", "recognition_score": 0.5370414175933671, "ground_truth": 0}, {"key": "39781995", "model": "llama", "target_model": "claude", "recognition_score": 0.5467381556769593, "ground_truth": 0}, {"key": "39781995", "model": "llama", "target_model": "gpt4", "recognition_score": 0.2814056215918467, "ground_truth": 0}, {"key": "39781995", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7154240007789953, "ground_truth": 0}, {"key": "22799372", "model": "llama", "target_model": "llama", "recognition_score": 0.9518632352736267, "ground_truth": 1}, {"key": "22799372", "model": "llama", "target_model": "human", "recognition_score": 0.9795114439759228, "ground_truth": 0}, {"key": "22799372", "model": "llama", "target_model": "claude", "recognition_score": 0.9799765596576997, "ground_truth": 0}, {"key": "22799372", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9763105294756327, "ground_truth": 0}, {"key": "22799372", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9882221582994477, "ground_truth": 0}, {"key": "37428240", "model": "llama", "target_model": "llama", "recognition_score": 0.8244619240681555, "ground_truth": 1}, {"key": "37428240", "model": "llama", "target_model": "human", "recognition_score": 0.7879311870056692, "ground_truth": 0}, {"key": "37428240", "model": "llama", "target_model": "claude", "recognition_score": 0.8175744804297687, "ground_truth": 0}, {"key": "37428240", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8300437743917939, "ground_truth": 0}, {"key": "37428240", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7154239994173771, "ground_truth": 0}, {"key": "40612657", "model": "llama", "target_model": "llama", "recognition_score": 0.9804313220991298, "ground_truth": 1}, {"key": "40612657", "model": "llama", "target_model": "human", "recognition_score": 0.9905874105139346, "ground_truth": 0}, {"key": "40612657", "model": "llama", "target_model": "claude", "recognition_score": 0.9600626839504057, "ground_truth": 0}, {"key": "40612657", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9793540713586283, "ground_truth": 0}, {"key": "40612657", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9728307694403848, "ground_truth": 0}, {"key": "34404662", "model": "llama", "target_model": "llama", "recognition_score": 0.8969755713125396, "ground_truth": 1}, {"key": "34404662", "model": "llama", "target_model": "human", "recognition_score": 0.8856314836772736, "ground_truth": 0}, {"key": "34404662", "model": "llama", "target_model": "claude", "recognition_score": 0.927887797914026, "ground_truth": 0}, {"key": "34404662", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9273632884076827, "ground_truth": 0}, {"key": "34404662", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8019358277266055, "ground_truth": 0}, {"key": "32619704", "model": "llama", "target_model": "llama", "recognition_score": 0.692642004675639, "ground_truth": 1}, {"key": "32619704", "model": "llama", "target_model": "human", "recognition_score": 0.8300437693482922, "ground_truth": 0}, {"key": "32619704", "model": "llama", "target_model": "claude", "recognition_score": 0.8895288534216683, "ground_truth": 0}, {"key": "32619704", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7476159515089994, "ground_truth": 0}, {"key": "32619704", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7772998585925264, "ground_truth": 0}, {"key": "39014883", "model": "llama", "target_model": "llama", "recognition_score": 0.7956581120275492, "ground_truth": 1}, {"key": "39014883", "model": "llama", "target_model": "human", "recognition_score": 0.791821075573076, "ground_truth": 0}, {"key": "39014883", "model": "llama", "target_model": "claude", "recognition_score": 0.7446563545848653, "ground_truth": 0}, {"key": "39014883", "model": "llama", "target_model": "gpt4", "recognition_score": 0.762070114376909, "ground_truth": 0}, {"key": "39014883", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7233094819917147, "ground_truth": 0}, {"key": "37982812", "model": "llama", "target_model": "llama", "recognition_score": 0.8633916099153109, "ground_truth": 1}, {"key": "37982812", "model": "llama", "target_model": "human", "recognition_score": 0.8783142474512311, "ground_truth": 0}, {"key": "37982812", "model": "llama", "target_model": "claude", "recognition_score": 0.9734434267902747, "ground_truth": 0}, {"key": "37982812", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8848377620830079, "ground_truth": 0}, {"key": "37982812", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9178933728481785, "ground_truth": 0}, {"key": "28123476", "model": "llama", "target_model": "llama", "recognition_score": 0.9284087979328223, "ground_truth": 1}, {"key": "28123476", "model": "llama", "target_model": "human", "recognition_score": 0.8152324844676447, "ground_truth": 0}, {"key": "28123476", "model": "llama", "target_model": "claude", "recognition_score": 0.8933094050797149, "ground_truth": 0}, {"key": "28123476", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8615382158311709, "ground_truth": 0}, {"key": "28123476", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9343951599381995, "ground_truth": 0}, {"key": "39078849", "model": "llama", "target_model": "llama", "recognition_score": 0.7994423156550461, "ground_truth": 1}, {"key": "39078849", "model": "llama", "target_model": "human", "recognition_score": 0.7676898695366012, "ground_truth": 0}, {"key": "39078849", "model": "llama", "target_model": "claude", "recognition_score": 0.8774767748465364, "ground_truth": 0}, {"key": "39078849", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8031738053909462, "ground_truth": 0}, {"key": "39078849", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7461389894753601, "ground_truth": 0}, {"key": "39414137", "model": "llama", "target_model": "llama", "recognition_score": 0.9615338056038516, "ground_truth": 1}, {"key": "39414137", "model": "llama", "target_model": "human", "recognition_score": 0.9257686361320521, "ground_truth": 0}, {"key": "39414137", "model": "llama", "target_model": "claude", "recognition_score": 0.9257686210304271, "ground_truth": 0}, {"key": "39414137", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9372107919480889, "ground_truth": 0}, {"key": "39414137", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9597620539593986, "ground_truth": 0}, {"key": "37371354", "model": "llama", "target_model": "llama", "recognition_score": 0.7461389879514676, "ground_truth": 1}, {"key": "37371354", "model": "llama", "target_model": "human", "recognition_score": 0.8679338292916274, "ground_truth": 0}, {"key": "37371354", "model": "llama", "target_model": "claude", "recognition_score": 0.6909762678802844, "ground_truth": 0}, {"key": "37371354", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8449215228486033, "ground_truth": 0}, {"key": "37371354", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7386690755132894, "ground_truth": 0}, {"key": "29497179", "model": "llama", "target_model": "llama", "recognition_score": 0.965899574961649, "ground_truth": 1}, {"key": "29497179", "model": "llama", "target_model": "human", "recognition_score": 0.8418256598945694, "ground_truth": 0}, {"key": "29497179", "model": "llama", "target_model": "claude", "recognition_score": 0.9161096075087325, "ground_truth": 0}, {"key": "29497179", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8624675194506727, "ground_truth": 0}, {"key": "29497179", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9196425251360574, "ground_truth": 0}, {"key": "35908694", "model": "llama", "target_model": "llama", "recognition_score": 0.9623913617815454, "ground_truth": 1}, {"key": "35908694", "model": "llama", "target_model": "human", "recognition_score": 0.9637799466658767, "ground_truth": 0}, {"key": "35908694", "model": "llama", "target_model": "claude", "recognition_score": 0.9496693688304035, "ground_truth": 0}, {"key": "35908694", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9449947122345738, "ground_truth": 0}, {"key": "35908694", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9632305310108501, "ground_truth": 0}, {"key": "37619358", "model": "llama", "target_model": "llama", "recognition_score": 0.581303100889381, "ground_truth": 1}, {"key": "37619358", "model": "llama", "target_model": "human", "recognition_score": 0.8164063893490501, "ground_truth": 0}, {"key": "37619358", "model": "llama", "target_model": "claude", "recognition_score": 0.6791787204759773, "ground_truth": 0}, {"key": "37619358", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5851011478400325, "ground_truth": 0}, {"key": "37619358", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6132365677850405, "ground_truth": 0}, {"key": "37293103", "model": "llama", "target_model": "llama", "recognition_score": 0.8558511483690528, "ground_truth": 1}, {"key": "37293103", "model": "llama", "target_model": "human", "recognition_score": 0.7264256232966824, "ground_truth": 0}, {"key": "37293103", "model": "llama", "target_model": "claude", "recognition_score": 0.9213576139522013, "ground_truth": 0}, {"key": "37293103", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9362850060232119, "ground_truth": 0}, {"key": "37293103", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9167080761249997, "ground_truth": 0}, {"key": "36883729", "model": "llama", "target_model": "llama", "recognition_score": 0.6619228567697294, "ground_truth": 1}, {"key": "36883729", "model": "llama", "target_model": "human", "recognition_score": 0.5389832147833911, "ground_truth": 0}, {"key": "36883729", "model": "llama", "target_model": "claude", "recognition_score": 0.4804786920876014, "ground_truth": 0}, {"key": "36883729", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7416740083418423, "ground_truth": 0}, {"key": "36883729", "model": "llama", "target_model": "gpt35", "recognition_score": 0.42632158778029855, "ground_truth": 0}, {"key": "39209521", "model": "llama", "target_model": "llama", "recognition_score": 0.7233094573728047, "ground_truth": 1}, {"key": "39209521", "model": "llama", "target_model": "human", "recognition_score": 0.8428631673637781, "ground_truth": 0}, {"key": "39209521", "model": "llama", "target_model": "claude", "recognition_score": 0.8459424270092635, "ground_truth": 0}, {"key": "39209521", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8749346299930478, "ground_truth": 0}, {"key": "39209521", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8606036184046475, "ground_truth": 0}, {"key": "27792571", "model": "llama", "target_model": "llama", "recognition_score": 0.8723473733736361, "ground_truth": 1}, {"key": "27792571", "model": "llama", "target_model": "human", "recognition_score": 0.9130583416455264, "ground_truth": 0}, {"key": "27792571", "model": "llama", "target_model": "claude", "recognition_score": 0.8558511600318053, "ground_truth": 0}, {"key": "27792571", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8879840449613025, "ground_truth": 0}, {"key": "27792571", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8783142527002751, "ground_truth": 0}, {"key": "39755647", "model": "llama", "target_model": "llama", "recognition_score": 0.8732148226687756, "ground_truth": 1}, {"key": "39755647", "model": "llama", "target_model": "human", "recognition_score": 0.9403530662044395, "ground_truth": 0}, {"key": "39755647", "model": "llama", "target_model": "claude", "recognition_score": 0.8558511460366623, "ground_truth": 0}, {"key": "39755647", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8210440990045367, "ground_truth": 0}, {"key": "39755647", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9319595765902414, "ground_truth": 0}, {"key": "40800537", "model": "llama", "target_model": "llama", "recognition_score": 0.3522017798132499, "ground_truth": 1}, {"key": "40800537", "model": "llama", "target_model": "human", "recognition_score": 0.6150878410043027, "ground_truth": 0}, {"key": "40800537", "model": "llama", "target_model": "claude", "recognition_score": 0.2674081625622251, "ground_truth": 0}, {"key": "40800537", "model": "llama", "target_model": "gpt4", "recognition_score": 0.37754065839853196, "ground_truth": 0}, {"key": "40800537", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5039061670464728, "ground_truth": 0}, {"key": "14171461", "model": "llama", "target_model": "llama", "recognition_score": 0.7981867817925009, "ground_truth": 1}, {"key": "14171461", "model": "llama", "target_model": "human", "recognition_score": 0.8289388086376276, "ground_truth": 0}, {"key": "14171461", "model": "llama", "target_model": "claude", "recognition_score": 0.8397339732576037, "ground_truth": 0}, {"key": "14171461", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8031737757671207, "ground_truth": 0}, {"key": "14171461", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7772998702913791, "ground_truth": 0}, {"key": "36892440", "model": "llama", "target_model": "llama", "recognition_score": 0.19559408541391593, "ground_truth": 1}, {"key": "36892440", "model": "llama", "target_model": "human", "recognition_score": 0.34334173024934583, "ground_truth": 0}, {"key": "36892440", "model": "llama", "target_model": "claude", "recognition_score": 0.3886179967274296, "ground_truth": 0}, {"key": "36892440", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6460137020872173, "ground_truth": 0}, {"key": "36892440", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4571367256176371, "ground_truth": 0}, {"key": "33733410", "model": "llama", "target_model": "llama", "recognition_score": 0.7401743491648709, "ground_truth": 1}, {"key": "33733410", "model": "llama", "target_model": "human", "recognition_score": 0.800691994858978, "ground_truth": 0}, {"key": "33733410", "model": "llama", "target_model": "claude", "recognition_score": 0.7534666547255334, "ground_truth": 0}, {"key": "33733410", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5945512768500263, "ground_truth": 0}, {"key": "33733410", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6842640111318635, "ground_truth": 0}, {"key": "38587765", "model": "llama", "target_model": "llama", "recognition_score": 0.4301473644033896, "ground_truth": 1}, {"key": "38587765", "model": "llama", "target_model": "human", "recognition_score": 0.5698526639967826, "ground_truth": 0}, {"key": "38587765", "model": "llama", "target_model": "claude", "recognition_score": 0.7606506616930114, "ground_truth": 0}, {"key": "38587765", "model": "llama", "target_model": "gpt4", "recognition_score": 0.20434189965087138, "ground_truth": 0}, {"key": "38587765", "model": "llama", "target_model": "gpt35", "recognition_score": 0.47073661020718394, "ground_truth": 0}, {"key": "41065582", "model": "llama", "target_model": "llama", "recognition_score": 0.7416740229194173, "ground_truth": 1}, {"key": "41065582", "model": "llama", "target_model": "human", "recognition_score": 0.5679366212542211, "ground_truth": 0}, {"key": "41065582", "model": "llama", "target_model": "claude", "recognition_score": 0.697608912295713, "ground_truth": 0}, {"key": "41065582", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6601723632854809, "ground_truth": 0}, {"key": "41065582", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5563995771796449, "ground_truth": 0}, {"key": "34713891", "model": "llama", "target_model": "llama", "recognition_score": 0.3259495275683774, "ground_truth": 1}, {"key": "34713891", "model": "llama", "target_model": "human", "recognition_score": 0.472683473782138, "ground_truth": 0}, {"key": "34713891", "model": "llama", "target_model": "claude", "recognition_score": 0.6187804184356783, "ground_truth": 0}, {"key": "34713891", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3174262812567006, "ground_truth": 0}, {"key": "34713891", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6424324728440912, "ground_truth": 0}, {"key": "18913023", "model": "llama", "target_model": "llama", "recognition_score": 0.9518632224691965, "ground_truth": 1}, {"key": "18913023", "model": "llama", "target_model": "human", "recognition_score": 0.957912271700912, "ground_truth": 0}, {"key": "18913023", "model": "llama", "target_model": "claude", "recognition_score": 0.9425067260887507, "ground_truth": 0}, {"key": "18913023", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9425067209277502, "ground_truth": 0}, {"key": "18913023", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9412234428186438, "ground_truth": 0}, {"key": "36884100", "model": "llama", "target_model": "llama", "recognition_score": 0.26894142928308745, "ground_truth": 1}, {"key": "36884100", "model": "llama", "target_model": "human", "recognition_score": 0.6842640470092315, "ground_truth": 0}, {"key": "36884100", "model": "llama", "target_model": "claude", "recognition_score": 0.33111972843044574, "ground_truth": 0}, {"key": "36884100", "model": "llama", "target_model": "gpt4", "recognition_score": 0.307358023718535, "ground_truth": 0}, {"key": "36884100", "model": "llama", "target_model": "gpt35", "recognition_score": 0.2798284982094848, "ground_truth": 0}, {"key": "39899913", "model": "llama", "target_model": "llama", "recognition_score": 0.9252299595557697, "ground_truth": 1}, {"key": "39899913", "model": "llama", "target_model": "human", "recognition_score": 0.8933094091767414, "ground_truth": 0}, {"key": "39899913", "model": "llama", "target_model": "claude", "recognition_score": 0.8799743766190936, "ground_truth": 0}, {"key": "39899913", "model": "llama", "target_model": "gpt4", "recognition_score": 0.898410550089512, "ground_truth": 0}, {"key": "39899913", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8499711740747368, "ground_truth": 0}, {"key": "30725366", "model": "llama", "target_model": "llama", "recognition_score": 0.0973904011253056, "ground_truth": 1}, {"key": "30725366", "model": "llama", "target_model": "human", "recognition_score": 0.19436781434775963, "ground_truth": 0}, {"key": "30725366", "model": "llama", "target_model": "claude", "recognition_score": 0.08509904258933029, "ground_truth": 0}, {"key": "30725366", "model": "llama", "target_model": "gpt4", "recognition_score": 0.07477004906703079, "ground_truth": 0}, {"key": "30725366", "model": "llama", "target_model": "gpt35", "recognition_score": 0.1431877096681502, "ground_truth": 0}, {"key": "26133523", "model": "llama", "target_model": "llama", "recognition_score": 0.7233094708948637, "ground_truth": 1}, {"key": "26133523", "model": "llama", "target_model": "human", "recognition_score": 0.5679366223705283, "ground_truth": 0}, {"key": "26133523", "model": "llama", "target_model": "claude", "recognition_score": 0.8697145685744864, "ground_truth": 0}, {"key": "26133523", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7185943893428383, "ground_truth": 0}, {"key": "26133523", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7732163600682529, "ground_truth": 0}, {"key": "29332665", "model": "llama", "target_model": "llama", "recognition_score": 0.86060361715266, "ground_truth": 1}, {"key": "29332665", "model": "llama", "target_model": "human", "recognition_score": 0.852935464331078, "ground_truth": 0}, {"key": "29332665", "model": "llama", "target_model": "claude", "recognition_score": 0.8365545592703372, "ground_truth": 0}, {"key": "29332665", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7969253636251841, "ground_truth": 0}, {"key": "29332665", "model": "llama", "target_model": "gpt35", "recognition_score": 0.921357625730681, "ground_truth": 0}, {"key": "37400481", "model": "llama", "target_model": "llama", "recognition_score": 0.9367494778596844, "ground_truth": 1}, {"key": "37400481", "model": "llama", "target_model": "human", "recognition_score": 0.9477691394179345, "ground_truth": 0}, {"key": "37400481", "model": "llama", "target_model": "claude", "recognition_score": 0.9469902316810663, "ground_truth": 0}, {"key": "37400481", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9635062318453385, "ground_truth": 0}, {"key": "37400481", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9155072498869737, "ground_truth": 0}, {"key": "38787241", "model": "llama", "target_model": "llama", "recognition_score": 0.7866228227979966, "ground_truth": 1}, {"key": "38787241", "model": "llama", "target_model": "human", "recognition_score": 0.7264256084891378, "ground_truth": 0}, {"key": "38787241", "model": "llama", "target_model": "claude", "recognition_score": 0.8489722082841676, "ground_truth": 0}, {"key": "38787241", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8799743696221155, "ground_truth": 0}, {"key": "38787241", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8006920048332128, "ground_truth": 0}, {"key": "38225963", "model": "llama", "target_model": "llama", "recognition_score": 0.7264256064998205, "ground_truth": 1}, {"key": "38225963", "model": "llama", "target_model": "human", "recognition_score": 0.8489721977020692, "ground_truth": 0}, {"key": "38225963", "model": "llama", "target_model": "claude", "recognition_score": 0.8438951205147739, "ground_truth": 0}, {"key": "38225963", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8697145830931482, "ground_truth": 0}, {"key": "38225963", "model": "llama", "target_model": "gpt35", "recognition_score": 0.874077223994447, "ground_truth": 0}, {"key": "26072034", "model": "llama", "target_model": "llama", "recognition_score": 0.16132022652430425, "ground_truth": 1}, {"key": "26072034", "model": "llama", "target_model": "human", "recognition_score": 0.07751765725417407, "ground_truth": 0}, {"key": "26072034", "model": "llama", "target_model": "claude", "recognition_score": 0.38121954634543453, "ground_truth": 0}, {"key": "26072034", "model": "llama", "target_model": "gpt4", "recognition_score": 0.10374862712681455, "ground_truth": 0}, {"key": "26072034", "model": "llama", "target_model": "gpt35", "recognition_score": 0.19193277491789942, "ground_truth": 0}, {"key": "35690810", "model": "llama", "target_model": "llama", "recognition_score": 0.8606036213996714, "ground_truth": 1}, {"key": "35690810", "model": "llama", "target_model": "human", "recognition_score": 0.8832359930035729, "ground_truth": 0}, {"key": "35690810", "model": "llama", "target_model": "claude", "recognition_score": 0.7718434949955801, "ground_truth": 0}, {"key": "35690810", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9309620779688423, "ground_truth": 0}, {"key": "35690810", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8991213832535668, "ground_truth": 0}, {"key": "36855665", "model": "llama", "target_model": "llama", "recognition_score": 0.9832145109706067, "ground_truth": 1}, {"key": "36855665", "model": "llama", "target_model": "human", "recognition_score": 0.9854964195702015, "ground_truth": 0}, {"key": "36855665", "model": "llama", "target_model": "claude", "recognition_score": 0.9738443834759914, "ground_truth": 0}, {"key": "36855665", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9750122079853285, "ground_truth": 0}, {"key": "36855665", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9645892699631398, "ground_truth": 0}, {"key": "29757662", "model": "llama", "target_model": "llama", "recognition_score": 0.7745833728108231, "ground_truth": 1}, {"key": "29757662", "model": "llama", "target_model": "human", "recognition_score": 0.8407825855111919, "ground_truth": 0}, {"key": "29757662", "model": "llama", "target_model": "claude", "recognition_score": 0.790530317242606, "ground_truth": 0}, {"key": "29757662", "model": "llama", "target_model": "gpt4", "recognition_score": 0.740174364416723, "ground_truth": 0}, {"key": "29757662", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5136684894780612, "ground_truth": 0}, {"key": "19134339", "model": "llama", "target_model": "llama", "recognition_score": 0.8092759948632344, "ground_truth": 1}, {"key": "19134339", "model": "llama", "target_model": "human", "recognition_score": 0.7759445320053149, "ground_truth": 0}, {"key": "19134339", "model": "llama", "target_model": "claude", "recognition_score": 0.7969253728470383, "ground_truth": 0}, {"key": "19134339", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7386690568783755, "ground_truth": 0}, {"key": "19134339", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8438950927052444, "ground_truth": 0}, {"key": "35360732", "model": "llama", "target_model": "llama", "recognition_score": 0.9372107921931097, "ground_truth": 1}, {"key": "35360732", "model": "llama", "target_model": "human", "recognition_score": 0.9390248180145037, "ground_truth": 0}, {"key": "35360732", "model": "llama", "target_model": "claude", "recognition_score": 0.9278877966220156, "ground_truth": 0}, {"key": "35360732", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8799743713156831, "ground_truth": 0}, {"key": "35360732", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8998277922336961, "ground_truth": 0}, {"key": "37713629", "model": "llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 1}, {"key": "37713629", "model": "llama", "target_model": "human", "recognition_score": 0.5926665835717645, "ground_truth": 0}, {"key": "37713629", "model": "llama", "target_model": "claude", "recognition_score": 0.4882834051473592, "ground_truth": 0}, {"key": "37713629", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5583269943160402, "ground_truth": 0}, {"key": "37713629", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5851011657530614, "ground_truth": 0}, {"key": "33393394", "model": "llama", "target_model": "llama", "recognition_score": 0.8879840417566067, "ground_truth": 1}, {"key": "33393394", "model": "llama", "target_model": "human", "recognition_score": 0.8519528024482191, "ground_truth": 0}, {"key": "33393394", "model": "llama", "target_model": "claude", "recognition_score": 0.7799929090471562, "ground_truth": 0}, {"key": "33393394", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7106283155711244, "ground_truth": 0}, {"key": "33393394", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8955226738959103, "ground_truth": 0}, {"key": "32275837", "model": "llama", "target_model": "llama", "recognition_score": 0.8661325092201332, "ground_truth": 1}, {"key": "32275837", "model": "llama", "target_model": "human", "recognition_score": 0.9525741261070841, "ground_truth": 0}, {"key": "32275837", "model": "llama", "target_model": "claude", "recognition_score": 0.9658995742050616, "ground_truth": 0}, {"key": "32275837", "model": "llama", "target_model": "gpt4", "recognition_score": 0.877476785655689, "ground_truth": 0}, {"key": "32275837", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8832359798746949, "ground_truth": 0}, {"key": "21458094", "model": "llama", "target_model": "llama", "recognition_score": 0.7248702767892603, "ground_truth": 1}, {"key": "21458094", "model": "llama", "target_model": "human", "recognition_score": 0.6424324627507053, "ground_truth": 0}, {"key": "21458094", "model": "llama", "target_model": "claude", "recognition_score": 0.726425624874158, "ground_truth": 0}, {"key": "21458094", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8187368043999673, "ground_truth": 0}, {"key": "21458094", "model": "llama", "target_model": "gpt35", "recognition_score": 0.910545398454442, "ground_truth": 0}, {"key": "40975362", "model": "llama", "target_model": "llama", "recognition_score": 0.8688267799638422, "ground_truth": 1}, {"key": "40975362", "model": "llama", "target_model": "human", "recognition_score": 0.9230391658862596, "ground_truth": 0}, {"key": "40975362", "model": "llama", "target_model": "claude", "recognition_score": 0.8539127471339033, "ground_truth": 0}, {"key": "40975362", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8832359926027477, "ground_truth": 0}, {"key": "40975362", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7956580949945884, "ground_truth": 0}, {"key": "35234201", "model": "llama", "target_model": "llama", "recognition_score": 0.9026096011771654, "ground_truth": 1}, {"key": "35234201", "model": "llama", "target_model": "human", "recognition_score": 0.8807970869136512, "ground_truth": 0}, {"key": "35234201", "model": "llama", "target_model": "claude", "recognition_score": 0.6671476869580926, "ground_truth": 0}, {"key": "35234201", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8311430574186637, "ground_truth": 0}, {"key": "35234201", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8864204067544427, "ground_truth": 0}, {"key": "36037573", "model": "llama", "target_model": "llama", "recognition_score": 0.8766343693969765, "ground_truth": 1}, {"key": "36037573", "model": "llama", "target_model": "human", "recognition_score": 0.9358173533757653, "ground_truth": 0}, {"key": "36037573", "model": "llama", "target_model": "claude", "recognition_score": 0.9358173573397109, "ground_truth": 0}, {"key": "36037573", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9073122127057787, "ground_truth": 0}, {"key": "36037573", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9319595840704199, "ground_truth": 0}, {"key": "30861915", "model": "llama", "target_model": "llama", "recognition_score": 0.9485372347693315, "ground_truth": 1}, {"key": "30861915", "model": "llama", "target_model": "human", "recognition_score": 0.9224823418070687, "ground_truth": 0}, {"key": "30861915", "model": "llama", "target_model": "claude", "recognition_score": 0.955651415252094, "ground_truth": 0}, {"key": "30861915", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9637799428059969, "ground_truth": 0}, {"key": "30861915", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9437636557685026, "ground_truth": 0}, {"key": "40173012", "model": "llama", "target_model": "llama", "recognition_score": 0.30239108662474895, "ground_truth": 1}, {"key": "40173012", "model": "llama", "target_model": "human", "recognition_score": 0.1634454275104153, "ground_truth": 0}, {"key": "40173012", "model": "llama", "target_model": "claude", "recognition_score": 0.3398276140091229, "ground_truth": 0}, {"key": "40173012", "model": "llama", "target_model": "gpt4", "recognition_score": 0.1943678251921796, "ground_truth": 0}, {"key": "40173012", "model": "llama", "target_model": "gpt35", "recognition_score": 0.23651622630725944, "ground_truth": 0}, {"key": "35100330", "model": "llama", "target_model": "llama", "recognition_score": 0.7490872104478153, "ground_truth": 1}, {"key": "35100330", "model": "llama", "target_model": "human", "recognition_score": 0.7154239963545185, "ground_truth": 0}, {"key": "35100330", "model": "llama", "target_model": "claude", "recognition_score": 0.3942009438344991, "ground_truth": 0}, {"key": "35100330", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6808786087310914, "ground_truth": 0}, {"key": "35100330", "model": "llama", "target_model": "gpt35", "recognition_score": 0.36840569691084657, "ground_truth": 0}, {"key": "37220221", "model": "llama", "target_model": "llama", "recognition_score": 0.9566342005866039, "ground_truth": 1}, {"key": "37220221", "model": "llama", "target_model": "human", "recognition_score": 0.9899086838747688, "ground_truth": 0}, {"key": "37220221", "model": "llama", "target_model": "claude", "recognition_score": 0.9546474206404862, "ground_truth": 0}, {"key": "37220221", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9339146228852844, "ground_truth": 0}, {"key": "37220221", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9511422183072492, "ground_truth": 0}, {"key": "38815218", "model": "llama", "target_model": "llama", "recognition_score": 0.9585377298388539, "ground_truth": 1}, {"key": "38815218", "model": "llama", "target_model": "human", "recognition_score": 0.9553191252532224, "ground_truth": 0}, {"key": "38815218", "model": "llama", "target_model": "claude", "recognition_score": 0.9026096039040814, "ground_truth": 0}, {"key": "38815218", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9425067217402286, "ground_truth": 0}, {"key": "38815218", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9757623656533103, "ground_truth": 0}, {"key": "39379109", "model": "llama", "target_model": "llama", "recognition_score": 0.6334102478630486, "ground_truth": 1}, {"key": "39379109", "model": "llama", "target_model": "human", "recognition_score": 0.5660185540897674, "ground_truth": 0}, {"key": "39379109", "model": "llama", "target_model": "claude", "recognition_score": 0.6757646113944499, "ground_truth": 0}, {"key": "39379109", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6774740166269736, "ground_truth": 0}, {"key": "39379109", "model": "llama", "target_model": "gpt35", "recognition_score": 0.45326184663355157, "ground_truth": 0}, {"key": "14576125", "model": "llama", "target_model": "llama", "recognition_score": 0.06465348379582869, "ground_truth": 1}, {"key": "14576125", "model": "llama", "target_model": "human", "recognition_score": 0.17106119011379914, "ground_truth": 0}, {"key": "14576125", "model": "llama", "target_model": "claude", "recognition_score": 0.10521053425255365, "ground_truth": 0}, {"key": "14576125", "model": "llama", "target_model": "gpt4", "recognition_score": 0.09670579634361465, "ground_truth": 0}, {"key": "14576125", "model": "llama", "target_model": "gpt35", "recognition_score": 0.039638841483560665, "ground_truth": 0}, {"key": "40814250", "model": "llama", "target_model": "llama", "recognition_score": 0.75055276470726, "ground_truth": 1}, {"key": "40814250", "model": "llama", "target_model": "human", "recognition_score": 0.8056321955266219, "ground_truth": 0}, {"key": "40814250", "model": "llama", "target_model": "claude", "recognition_score": 0.8333245968486859, "ground_truth": 0}, {"key": "40814250", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7371581730954104, "ground_truth": 0}, {"key": "40814250", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8428631464650387, "ground_truth": 0}, {"key": "36334488", "model": "llama", "target_model": "llama", "recognition_score": 0.5097643796130081, "ground_truth": 1}, {"key": "36334488", "model": "llama", "target_model": "human", "recognition_score": 0.6242935525451602, "ground_truth": 0}, {"key": "36334488", "model": "llama", "target_model": "claude", "recognition_score": 0.6706082690414302, "ground_truth": 0}, {"key": "36334488", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5039061773966039, "ground_truth": 0}, {"key": "36334488", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5253688139689942, "ground_truth": 0}, {"key": "36888322", "model": "llama", "target_model": "llama", "recognition_score": 0.8278281504298858, "ground_truth": 1}, {"key": "36888322", "model": "llama", "target_model": "human", "recognition_score": 0.3720487999188531, "ground_truth": 0}, {"key": "36888322", "model": "llama", "target_model": "claude", "recognition_score": 0.8624675264288741, "ground_truth": 0}, {"key": "36888322", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7057850294316995, "ground_truth": 0}, {"key": "36888322", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6893055903954499, "ground_truth": 0}, {"key": "37318916", "model": "llama", "target_model": "llama", "recognition_score": 0.9012274178620953, "ground_truth": 1}, {"key": "37318916", "model": "llama", "target_model": "human", "recognition_score": 0.9623913635703201, "ground_truth": 0}, {"key": "37318916", "model": "llama", "target_model": "claude", "recognition_score": 0.9582261249656857, "ground_truth": 0}, {"key": "37318916", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9496693661244429, "ground_truth": 0}, {"key": "37318916", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9697854102911747, "ground_truth": 0}, {"key": "39308700", "model": "llama", "target_model": "llama", "recognition_score": 0.39793841669748414, "ground_truth": 1}, {"key": "39308700", "model": "llama", "target_model": "human", "recognition_score": 0.4590761204606793, "ground_truth": 0}, {"key": "39308700", "model": "llama", "target_model": "claude", "recognition_score": 0.36477755873773393, "ground_truth": 0}, {"key": "39308700", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4863315348646975, "ground_truth": 0}, {"key": "39308700", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4532618308057951, "ground_truth": 0}, {"key": "31061543", "model": "llama", "target_model": "llama", "recognition_score": 0.7264256061968317, "ground_truth": 1}, {"key": "31061543", "model": "llama", "target_model": "human", "recognition_score": 0.9339146175434373, "ground_truth": 0}, {"key": "31061543", "model": "llama", "target_model": "claude", "recognition_score": 0.7931059460079509, "ground_truth": 0}, {"key": "31061543", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9367494760667926, "ground_truth": 0}, {"key": "31061543", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8633916098876366, "ground_truth": 0}, {"key": "37380894", "model": "llama", "target_model": "llama", "recognition_score": 0.9241418227618046, "ground_truth": 1}, {"key": "37380894", "model": "llama", "target_model": "human", "recognition_score": 0.9539660962719536, "ground_truth": 0}, {"key": "37380894", "model": "llama", "target_model": "claude", "recognition_score": 0.9462003576593059, "ground_truth": 0}, {"key": "37380894", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8940517058177172, "ground_truth": 0}, {"key": "37380894", "model": "llama", "target_model": "gpt35", "recognition_score": 0.944176858178143, "ground_truth": 0}, {"key": "38410139", "model": "llama", "target_model": "llama", "recognition_score": 0.6723316850432537, "ground_truth": 1}, {"key": "38410139", "model": "llama", "target_model": "human", "recognition_score": 0.6842640111092526, "ground_truth": 0}, {"key": "38410139", "model": "llama", "target_model": "claude", "recognition_score": 0.9353465101805905, "ground_truth": 0}, {"key": "38410139", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7074046972308, "ground_truth": 0}, {"key": "38410139", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8499711788851143, "ground_truth": 0}, {"key": "35953842", "model": "llama", "target_model": "llama", "recognition_score": 0.5448014090159232, "ground_truth": 1}, {"key": "35953842", "model": "llama", "target_model": "human", "recognition_score": 0.9039745046689942, "ground_truth": 0}, {"key": "35953842", "model": "llama", "target_model": "claude", "recognition_score": 0.8233283918891231, "ground_truth": 0}, {"key": "35953842", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7690802616653099, "ground_truth": 0}, {"key": "35953842", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8816149144754581, "ground_truth": 0}, {"key": "39815663", "model": "llama", "target_model": "llama", "recognition_score": 0.3259494839172187, "ground_truth": 1}, {"key": "39815663", "model": "llama", "target_model": "human", "recognition_score": 0.17781087369203638, "ground_truth": 0}, {"key": "39815663", "model": "llama", "target_model": "claude", "recognition_score": 0.2829881190425535, "ground_truth": 0}, {"key": "39815663", "model": "llama", "target_model": "gpt4", "recognition_score": 0.24653333957270868, "ground_truth": 0}, {"key": "39815663", "model": "llama", "target_model": "gpt35", "recognition_score": 0.14608722473056943, "ground_truth": 0}, {"key": "35121432", "model": "llama", "target_model": "llama", "recognition_score": 0.9621075702920509, "ground_truth": 1}, {"key": "35121432", "model": "llama", "target_model": "human", "recognition_score": 0.936285001452421, "ground_truth": 0}, {"key": "35121432", "model": "llama", "target_model": "claude", "recognition_score": 0.904650528618842, "ground_truth": 0}, {"key": "35121432", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8633916000154761, "ground_truth": 0}, {"key": "35121432", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9039745183504407, "ground_truth": 0}, {"key": "21712310", "model": "llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 1}, {"key": "21712310", "model": "llama", "target_model": "human", "recognition_score": 0.6740504997537118, "ground_truth": 0}, {"key": "21712310", "model": "llama", "target_model": "claude", "recognition_score": 0.6926419961895087, "ground_truth": 0}, {"key": "21712310", "model": "llama", "target_model": "gpt4", "recognition_score": 0.727975443960618, "ground_truth": 0}, {"key": "21712310", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5467381110210559, "ground_truth": 0}, {"key": "37952914", "model": "llama", "target_model": "llama", "recognition_score": 0.9105454026500621, "ground_truth": 1}, {"key": "37952914", "model": "llama", "target_model": "human", "recognition_score": 0.8887587806796011, "ground_truth": 0}, {"key": "37952914", "model": "llama", "target_model": "claude", "recognition_score": 0.9390248200798299, "ground_truth": 0}, {"key": "37952914", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7461389780411106, "ground_truth": 0}, {"key": "37952914", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8705972709352039, "ground_truth": 0}, {"key": "38956779", "model": "llama", "target_model": "llama", "recognition_score": 0.7356416411451138, "ground_truth": 1}, {"key": "38956779", "model": "llama", "target_model": "human", "recognition_score": 0.44939263606474456, "ground_truth": 0}, {"key": "38956779", "model": "llama", "target_model": "claude", "recognition_score": 0.779992897835324, "ground_truth": 0}, {"key": "38956779", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7799928988989328, "ground_truth": 0}, {"key": "38956779", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4902355953577935, "ground_truth": 0}, {"key": "36101833", "model": "llama", "target_model": "llama", "recognition_score": 0.8962513663277333, "ground_truth": 1}, {"key": "36101833", "model": "llama", "target_model": "human", "recognition_score": 0.7732163638343892, "ground_truth": 0}, {"key": "36101833", "model": "llama", "target_model": "claude", "recognition_score": 0.9329437140896437, "ground_truth": 0}, {"key": "36101833", "model": "llama", "target_model": "gpt4", "recognition_score": 0.86971458295296, "ground_truth": 0}, {"key": "36101833", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9149009557859432, "ground_truth": 0}, {"key": "35544662", "model": "llama", "target_model": "llama", "recognition_score": 0.8539127471607907, "ground_truth": 1}, {"key": "35544662", "model": "llama", "target_model": "human", "recognition_score": 0.647798227594752, "ground_truth": 0}, {"key": "35544662", "model": "llama", "target_model": "claude", "recognition_score": 0.8418256607226221, "ground_truth": 0}, {"key": "35544662", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9235923140142255, "ground_truth": 0}, {"key": "35544662", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7233094496863582, "ground_truth": 0}, {"key": "39759044", "model": "llama", "target_model": "llama", "recognition_score": 0.501953092408819, "ground_truth": 1}, {"key": "39759044", "model": "llama", "target_model": "human", "recognition_score": 0.43782351342055187, "ground_truth": 0}, {"key": "39759044", "model": "llama", "target_model": "claude", "recognition_score": 0.6424324933760142, "ground_truth": 0}, {"key": "39759044", "model": "llama", "target_model": "gpt4", "recognition_score": 0.33807714598934197, "ground_truth": 0}, {"key": "39759044", "model": "llama", "target_model": "gpt35", "recognition_score": 0.47657967871846907, "ground_truth": 0}, {"key": "39433018", "model": "llama", "target_model": "llama", "recognition_score": 0.9588471069273301, "ground_truth": 1}, {"key": "39433018", "model": "llama", "target_model": "human", "recognition_score": 0.9367494771820635, "ground_truth": 0}, {"key": "39433018", "model": "llama", "target_model": "claude", "recognition_score": 0.9196425312000708, "ground_truth": 0}, {"key": "39433018", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9453993961772346, "ground_truth": 0}, {"key": "39433018", "model": "llama", "target_model": "gpt35", "recognition_score": 0.886420401367398, "ground_truth": 0}, {"key": "22111959", "model": "llama", "target_model": "llama", "recognition_score": 0.4882833867853946, "ground_truth": 1}, {"key": "22111959", "model": "llama", "target_model": "human", "recognition_score": 0.5544705007706741, "ground_truth": 0}, {"key": "22111959", "model": "llama", "target_model": "claude", "recognition_score": 0.7416739817195129, "ground_truth": 0}, {"key": "22111959", "model": "llama", "target_model": "gpt4", "recognition_score": 0.651354855229106, "ground_truth": 0}, {"key": "22111959", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7813306229420832, "ground_truth": 0}, {"key": "38210094", "model": "llama", "target_model": "llama", "recognition_score": 0.7041601282202976, "ground_truth": 1}, {"key": "38210094", "model": "llama", "target_model": "human", "recognition_score": 0.5156199167501416, "ground_truth": 0}, {"key": "38210094", "model": "llama", "target_model": "claude", "recognition_score": 0.6808786295667382, "ground_truth": 0}, {"key": "38210094", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6601723862124548, "ground_truth": 0}, {"key": "38210094", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5409238739010003, "ground_truth": 0}, {"key": "37675935", "model": "llama", "target_model": "llama", "recognition_score": 0.7446563421400166, "ground_truth": 1}, {"key": "37675935", "model": "llama", "target_model": "human", "recognition_score": 0.6757646140375464, "ground_truth": 0}, {"key": "37675935", "model": "llama", "target_model": "claude", "recognition_score": 0.5273165341472301, "ground_truth": 0}, {"key": "37675935", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6774740232888565, "ground_truth": 0}, {"key": "37675935", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5660185212789131, "ground_truth": 0}, {"key": "35732604", "model": "llama", "target_model": "llama", "recognition_score": 0.17441028395766833, "ground_truth": 1}, {"key": "35732604", "model": "llama", "target_model": "human", "recognition_score": 0.11279540884664459, "ground_truth": 0}, {"key": "35732604", "model": "llama", "target_model": "claude", "recognition_score": 0.17781087797304454, "ground_truth": 0}, {"key": "35732604", "model": "llama", "target_model": "gpt4", "recognition_score": 0.24508501236304744, "ground_truth": 0}, {"key": "35732604", "model": "llama", "target_model": "gpt35", "recognition_score": 0.11516223784338747, "ground_truth": 0}, {"key": "27453212", "model": "llama", "target_model": "llama", "recognition_score": 0.6791786916112155, "ground_truth": 1}, {"key": "27453212", "model": "llama", "target_model": "human", "recognition_score": 0.8386797628344301, "ground_truth": 0}, {"key": "27453212", "model": "llama", "target_model": "claude", "recognition_score": 0.9012274163810934, "ground_truth": 0}, {"key": "27453212", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8175744892871643, "ground_truth": 0}, {"key": "27453212", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8918110406393993, "ground_truth": 0}, {"key": "39910047", "model": "llama", "target_model": "llama", "recognition_score": 0.721743203485913, "ground_truth": 1}, {"key": "39910047", "model": "llama", "target_model": "human", "recognition_score": 0.6566582568035793, "ground_truth": 0}, {"key": "39910047", "model": "llama", "target_model": "claude", "recognition_score": 0.6859494741701874, "ground_truth": 0}, {"key": "39910047", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7826624877968867, "ground_truth": 0}, {"key": "39910047", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7943849424946796, "ground_truth": 0}, {"key": "40054265", "model": "llama", "target_model": "llama", "recognition_score": 0.6113819649495998, "ground_truth": 1}, {"key": "40054265", "model": "llama", "target_model": "human", "recognition_score": 0.6039318344617233, "ground_truth": 0}, {"key": "40054265", "model": "llama", "target_model": "claude", "recognition_score": 0.7592253970408355, "ground_truth": 0}, {"key": "40054265", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5983121953752328, "ground_truth": 0}, {"key": "40054265", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7386690785274453, "ground_truth": 0}, {"key": "19984615", "model": "llama", "target_model": "llama", "recognition_score": 0.4474602948157154, "ground_truth": 1}, {"key": "19984615", "model": "llama", "target_model": "human", "recognition_score": 0.5467381648710187, "ground_truth": 0}, {"key": "19984615", "model": "llama", "target_model": "claude", "recognition_score": 0.6113820214146302, "ground_truth": 0}, {"key": "19984615", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5350984482718899, "ground_truth": 0}, {"key": "19984615", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3793783834868771, "ground_truth": 0}, {"key": "16490806", "model": "llama", "target_model": "llama", "recognition_score": 0.3486451068925085, "ground_truth": 1}, {"key": "16490806", "model": "llama", "target_model": "human", "recognition_score": 0.7233094643876669, "ground_truth": 0}, {"key": "16490806", "model": "llama", "target_model": "claude", "recognition_score": 0.5214711914697021, "ground_truth": 0}, {"key": "16490806", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5983121669134029, "ground_truth": 0}, {"key": "16490806", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5350984238668, "ground_truth": 0}, {"key": "36396237", "model": "llama", "target_model": "llama", "recognition_score": 0.9704646638710054, "ground_truth": 1}, {"key": "36396237", "model": "llama", "target_model": "human", "recognition_score": 0.9717790109802459, "ground_truth": 0}, {"key": "36396237", "model": "llama", "target_model": "claude", "recognition_score": 0.9790357585277163, "ground_truth": 0}, {"key": "36396237", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9407897507600609, "ground_truth": 0}, {"key": "36396237", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9556514210409296, "ground_truth": 0}, {"key": "40726444", "model": "llama", "target_model": "llama", "recognition_score": 0.5370413626505244, "ground_truth": 1}, {"key": "40726444", "model": "llama", "target_model": "human", "recognition_score": 0.4436004037067071, "ground_truth": 0}, {"key": "40726444", "model": "llama", "target_model": "claude", "recognition_score": 0.6352224202912846, "ground_truth": 0}, {"key": "40726444", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4902355993724342, "ground_truth": 0}, {"key": "40726444", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5851011644928599, "ground_truth": 0}, {"key": "37314826", "model": "llama", "target_model": "llama", "recognition_score": 0.6654105712718298, "ground_truth": 1}, {"key": "37314826", "model": "llama", "target_model": "human", "recognition_score": 0.486331509839625, "ground_truth": 0}, {"key": "37314826", "model": "llama", "target_model": "claude", "recognition_score": 0.8723473784971314, "ground_truth": 0}, {"key": "37314826", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6206216049331359, "ground_truth": 0}, {"key": "37314826", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5926665818881911, "ground_truth": 0}, {"key": "38506971", "model": "llama", "target_model": "llama", "recognition_score": 0.7534666631943397, "ground_truth": 1}, {"key": "38506971", "model": "llama", "target_model": "human", "recognition_score": 0.7008948125628671, "ground_truth": 0}, {"key": "38506971", "model": "llama", "target_model": "claude", "recognition_score": 0.7341195376973522, "ground_truth": 0}, {"key": "38506971", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5813030984731871, "ground_truth": 0}, {"key": "38506971", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4746311435803359, "ground_truth": 0}, {"key": "40699312", "model": "llama", "target_model": "llama", "recognition_score": 0.9339146228703532, "ground_truth": 1}, {"key": "40699312", "model": "llama", "target_model": "human", "recognition_score": 0.9532750379923339, "ground_truth": 0}, {"key": "40699312", "model": "llama", "target_model": "claude", "recognition_score": 0.9053223047508665, "ground_truth": 0}, {"key": "40699312", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8210441093010997, "ground_truth": 0}, {"key": "40699312", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9005297804415447, "ground_truth": 0}, {"key": "34695474", "model": "llama", "target_model": "llama", "recognition_score": 0.8633916144660047, "ground_truth": 1}, {"key": "34695474", "model": "llama", "target_model": "human", "recognition_score": 0.8766343752206329, "ground_truth": 0}, {"key": "34695474", "model": "llama", "target_model": "claude", "recognition_score": 0.7931059487990882, "ground_truth": 0}, {"key": "34695474", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7106283293585407, "ground_truth": 0}, {"key": "34695474", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7577943779511546, "ground_truth": 0}, {"key": "36281498", "model": "llama", "target_model": "llama", "recognition_score": 0.7732163678987277, "ground_truth": 1}, {"key": "36281498", "model": "llama", "target_model": "human", "recognition_score": 0.754914974148782, "ground_truth": 0}, {"key": "36281498", "model": "llama", "target_model": "claude", "recognition_score": 0.8509646983348408, "ground_truth": 0}, {"key": "36281498", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8300437670163895, "ground_truth": 0}, {"key": "36281498", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7918210680402982, "ground_truth": 0}, {"key": "39558652", "model": "llama", "target_model": "llama", "recognition_score": 0.44939264970629106, "ground_truth": 1}, {"key": "39558652", "model": "llama", "target_model": "human", "recognition_score": 0.5525397025226699, "ground_truth": 0}, {"key": "39558652", "model": "llama", "target_model": "claude", "recognition_score": 0.7074047292993187, "ground_truth": 0}, {"key": "39558652", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7981867720872576, "ground_truth": 0}, {"key": "39558652", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8116760405182848, "ground_truth": 0}, {"key": "37330579", "model": "llama", "target_model": "llama", "recognition_score": 0.5039061745688865, "ground_truth": 1}, {"key": "37330579", "model": "llama", "target_model": "human", "recognition_score": 0.41869694086382125, "ground_truth": 0}, {"key": "37330579", "model": "llama", "target_model": "claude", "recognition_score": 0.1812632102281329, "ground_truth": 0}, {"key": "37330579", "model": "llama", "target_model": "gpt4", "recognition_score": 0.33633108793399374, "ground_truth": 0}, {"key": "37330579", "model": "llama", "target_model": "gpt35", "recognition_score": 0.48438008700483787, "ground_truth": 0}, {"key": "40547658", "model": "llama", "target_model": "llama", "recognition_score": 0.7138307399580452, "ground_truth": 1}, {"key": "40547658", "model": "llama", "target_model": "human", "recognition_score": 0.6187804258841749, "ground_truth": 0}, {"key": "40547658", "model": "llama", "target_model": "claude", "recognition_score": 0.6791787251104094, "ground_truth": 0}, {"key": "40547658", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8267118042148555, "ground_truth": 0}, {"key": "40547658", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7662936432044138, "ground_truth": 0}, {"key": "37119340", "model": "llama", "target_model": "llama", "recognition_score": 0.783988486293328, "ground_truth": 1}, {"key": "37119340", "model": "llama", "target_model": "human", "recognition_score": 0.631594309157605, "ground_truth": 0}, {"key": "37119340", "model": "llama", "target_model": "claude", "recognition_score": 0.8449215282280043, "ground_truth": 0}, {"key": "37119340", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9196425315616965, "ground_truth": 0}, {"key": "37119340", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6020615647707294, "ground_truth": 0}, {"key": "35301627", "model": "llama", "target_model": "llama", "recognition_score": 0.7264256147390177, "ground_truth": 1}, {"key": "35301627", "model": "llama", "target_model": "human", "recognition_score": 0.52731653801005, "ground_truth": 0}, {"key": "35301627", "model": "llama", "target_model": "claude", "recognition_score": 0.8459424416461829, "ground_truth": 0}, {"key": "35301627", "model": "llama", "target_model": "gpt4", "recognition_score": 0.766293645605346, "ground_truth": 0}, {"key": "35301627", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8322366677102656, "ground_truth": 0}, {"key": "34037168", "model": "llama", "target_model": "llama", "recognition_score": 0.3040416677004046, "ground_truth": 1}, {"key": "34037168", "model": "llama", "target_model": "human", "recognition_score": 0.37387581884025156, "ground_truth": 0}, {"key": "34037168", "model": "llama", "target_model": "claude", "recognition_score": 0.4130035574081124, "ground_truth": 0}, {"key": "34037168", "model": "llama", "target_model": "gpt4", "recognition_score": 0.47852883638192456, "ground_truth": 0}, {"key": "34037168", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4167966331815156, "ground_truth": 0}, {"key": "39703862", "model": "llama", "target_model": "llama", "recognition_score": 0.9669140219085405, "ground_truth": 1}, {"key": "39703862", "model": "llama", "target_model": "human", "recognition_score": 0.9597620565318301, "ground_truth": 0}, {"key": "39703862", "model": "llama", "target_model": "claude", "recognition_score": 0.981310692359276, "ground_truth": 0}, {"key": "39703862", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9732407183208893, "ground_truth": 0}, {"key": "39703862", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9546474202850573, "ground_truth": 0}, {"key": "16554814", "model": "llama", "target_model": "llama", "recognition_score": 0.7106283168306228, "ground_truth": 1}, {"key": "16554814", "model": "llama", "target_model": "human", "recognition_score": 0.808067213465708, "ground_truth": 0}, {"key": "16554814", "model": "llama", "target_model": "claude", "recognition_score": 0.7248702980272166, "ground_truth": 0}, {"key": "16554814", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7431680055685703, "ground_truth": 0}, {"key": "16554814", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5794004201391124, "ground_truth": 0}, {"key": "32983099", "model": "llama", "target_model": "llama", "recognition_score": 0.3812195590072139, "ground_truth": 1}, {"key": "32983099", "model": "llama", "target_model": "human", "recognition_score": 0.23091974910643556, "ground_truth": 0}, {"key": "32983099", "model": "llama", "target_model": "claude", "recognition_score": 0.6297745999579406, "ground_truth": 0}, {"key": "32983099", "model": "llama", "target_model": "gpt4", "recognition_score": 0.45519864299833857, "ground_truth": 0}, {"key": "32983099", "model": "llama", "target_model": "gpt35", "recognition_score": 0.37754064215320343, "ground_truth": 0}, {"key": "41072994", "model": "llama", "target_model": "llama", "recognition_score": 0.6774740300399258, "ground_truth": 1}, {"key": "41072994", "model": "llama", "target_model": "human", "recognition_score": 0.7170118693187232, "ground_truth": 0}, {"key": "41072994", "model": "llama", "target_model": "claude", "recognition_score": 0.5175708919513665, "ground_truth": 0}, {"key": "41072994", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6261241837170343, "ground_truth": 0}, {"key": "41072994", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5370414124343715, "ground_truth": 0}, {"key": "38396247", "model": "llama", "target_model": "llama", "recognition_score": 0.8940517106932795, "ground_truth": 1}, {"key": "38396247", "model": "llama", "target_model": "human", "recognition_score": 0.8757870024060798, "ground_truth": 0}, {"key": "38396247", "model": "llama", "target_model": "claude", "recognition_score": 0.9683812345172537, "ground_truth": 0}, {"key": "38396247", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9284088035268138, "ground_truth": 0}, {"key": "38396247", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9130583424187578, "ground_truth": 0}, {"key": "37507998", "model": "llama", "target_model": "llama", "recognition_score": 0.6757645729270175, "ground_truth": 1}, {"key": "37507998", "model": "llama", "target_model": "human", "recognition_score": 0.8044059273787757, "ground_truth": 0}, {"key": "37507998", "model": "llama", "target_model": "claude", "recognition_score": 0.9372107993501898, "ground_truth": 0}, {"key": "37507998", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8449215257907696, "ground_truth": 0}, {"key": "37507998", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8449215227831565, "ground_truth": 0}, {"key": "32593929", "model": "llama", "target_model": "llama", "recognition_score": 0.5389832403226084, "ground_truth": 1}, {"key": "32593929", "model": "llama", "target_model": "human", "recognition_score": 0.5370413719154158, "ground_truth": 0}, {"key": "32593929", "model": "llama", "target_model": "claude", "recognition_score": 0.6424324770678759, "ground_truth": 0}, {"key": "32593929", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5832033545454224, "ground_truth": 0}, {"key": "32593929", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6388352840179983, "ground_truth": 0}, {"key": "36056449", "model": "llama", "target_model": "llama", "recognition_score": 0.5097643791905241, "ground_truth": 1}, {"key": "36056449", "model": "llama", "target_model": "human", "recognition_score": 0.6020615653978094, "ground_truth": 0}, {"key": "36056449", "model": "llama", "target_model": "claude", "recognition_score": 0.649578607993522, "ground_truth": 0}, {"key": "36056449", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8092759756972271, "ground_truth": 0}, {"key": "36056449", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7138307483642752, "ground_truth": 0}, {"key": "21986185", "model": "llama", "target_model": "llama", "recognition_score": 0.13206615139958447, "ground_truth": 1}, {"key": "21986185", "model": "llama", "target_model": "human", "recognition_score": 0.18594720551945915, "ground_truth": 0}, {"key": "21986185", "model": "llama", "target_model": "claude", "recognition_score": 0.2365162408766622, "ground_truth": 0}, {"key": "21986185", "model": "llama", "target_model": "gpt4", "recognition_score": 0.12852512730992852, "ground_truth": 0}, {"key": "21986185", "model": "llama", "target_model": "gpt35", "recognition_score": 0.19806417866328913, "ground_truth": 0}, {"key": "40757465", "model": "llama", "target_model": "llama", "recognition_score": 0.8606036172392271, "ground_truth": 1}, {"key": "40757465", "model": "llama", "target_model": "human", "recognition_score": 0.9367494735120292, "ground_truth": 0}, {"key": "40757465", "model": "llama", "target_model": "claude", "recognition_score": 0.770464793950846, "ground_truth": 0}, {"key": "40757465", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5813031163196729, "ground_truth": 0}, {"key": "40757465", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5350984574240757, "ground_truth": 0}, {"key": "35198313", "model": "llama", "target_model": "llama", "recognition_score": 0.8104789152242252, "ground_truth": 1}, {"key": "35198313", "model": "llama", "target_model": "human", "recognition_score": 0.7217431936923486, "ground_truth": 0}, {"key": "35198313", "model": "llama", "target_model": "claude", "recognition_score": 0.7008948025263224, "ground_truth": 0}, {"key": "35198313", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8624675388322595, "ground_truth": 0}, {"key": "35198313", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6791786750588998, "ground_truth": 0}, {"key": "30604618", "model": "llama", "target_model": "llama", "recognition_score": 0.8539127537262323, "ground_truth": 1}, {"key": "30604618", "model": "llama", "target_model": "human", "recognition_score": 0.868826772951709, "ground_truth": 0}, {"key": "30604618", "model": "llama", "target_model": "claude", "recognition_score": 0.8757869795992328, "ground_truth": 0}, {"key": "30604618", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7534666376120798, "ground_truth": 0}, {"key": "30604618", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8164063603095623, "ground_truth": 0}, {"key": "35779006", "model": "llama", "target_model": "llama", "recognition_score": 0.9403530559494807, "ground_truth": 1}, {"key": "35779006", "model": "llama", "target_model": "human", "recognition_score": 0.7201715091073675, "ground_truth": 0}, {"key": "35779006", "model": "llama", "target_model": "claude", "recognition_score": 0.7356416508118397, "ground_truth": 0}, {"key": "35779006", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8140527870842406, "ground_truth": 0}, {"key": "35779006", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6242935386409936, "ground_truth": 0}, {"key": "33858956", "model": "llama", "target_model": "llama", "recognition_score": 0.8548846390342631, "ground_truth": 1}, {"key": "33858956", "model": "llama", "target_model": "human", "recognition_score": 0.8164063727058767, "ground_truth": 0}, {"key": "33858956", "model": "llama", "target_model": "claude", "recognition_score": 0.8955226807681049, "ground_truth": 0}, {"key": "33858956", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8643104476280437, "ground_truth": 0}, {"key": "33858956", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6757646050582687, "ground_truth": 0}, {"key": "38633880", "model": "llama", "target_model": "llama", "recognition_score": 0.40544871423716977, "ground_truth": 1}, {"key": "38633880", "model": "llama", "target_model": "human", "recognition_score": 0.4167966410257592, "ground_truth": 0}, {"key": "38633880", "model": "llama", "target_model": "claude", "recognition_score": 0.3647775561494478, "ground_truth": 0}, {"key": "38633880", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3345894354056796, "ground_truth": 0}, {"key": "38633880", "model": "llama", "target_model": "gpt35", "recognition_score": 0.320821298352903, "ground_truth": 0}, {"key": "36654905", "model": "llama", "target_model": "llama", "recognition_score": 0.9924812821641018, "ground_truth": 1}, {"key": "36654905", "model": "llama", "target_model": "human", "recognition_score": 0.9970878215987279, "ground_truth": 0}, {"key": "36654905", "model": "llama", "target_model": "claude", "recognition_score": 0.9939964041317394, "ground_truth": 0}, {"key": "36654905", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9759464447807239, "ground_truth": 0}, {"key": "36654905", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9695556521769652, "ground_truth": 0}, {"key": "26547482", "model": "llama", "target_model": "llama", "recognition_score": 0.5813030758097573, "ground_truth": 1}, {"key": "26547482", "model": "llama", "target_model": "human", "recognition_score": 0.4397473479119494, "ground_truth": 0}, {"key": "26547482", "model": "llama", "target_model": "claude", "recognition_score": 0.4921881483541701, "ground_truth": 0}, {"key": "26547482", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5851011715796479, "ground_truth": 0}, {"key": "26547482", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5794004159862923, "ground_truth": 0}, {"key": "36439068", "model": "llama", "target_model": "llama", "recognition_score": 0.876634380879683, "ground_truth": 1}, {"key": "36439068", "model": "llama", "target_model": "human", "recognition_score": 0.6757645802722178, "ground_truth": 0}, {"key": "36439068", "model": "llama", "target_model": "claude", "recognition_score": 0.8006919973007613, "ground_truth": 0}, {"key": "36439068", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6334102518328201, "ground_truth": 0}, {"key": "36439068", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5602526527689337, "ground_truth": 0}, {"key": "30501258", "model": "llama", "target_model": "llama", "recognition_score": 0.7490872057667823, "ground_truth": 1}, {"key": "30501258", "model": "llama", "target_model": "human", "recognition_score": 0.8233283845090799, "ground_truth": 0}, {"key": "30501258", "model": "llama", "target_model": "claude", "recognition_score": 0.6757646123460408, "ground_truth": 0}, {"key": "30501258", "model": "llama", "target_model": "gpt4", "recognition_score": 0.762070115505197, "ground_truth": 0}, {"key": "30501258", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7295198045875156, "ground_truth": 0}, {"key": "37560941", "model": "llama", "target_model": "llama", "recognition_score": 0.9433475739665592, "ground_truth": 1}, {"key": "37560941", "model": "llama", "target_model": "human", "recognition_score": 0.9465966678210368, "ground_truth": 0}, {"key": "37560941", "model": "llama", "target_model": "claude", "recognition_score": 0.8879840505806242, "ground_truth": 0}, {"key": "37560941", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9268352811451666, "ground_truth": 0}, {"key": "37560941", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9178933751180435, "ground_truth": 0}, {"key": "36801665", "model": "llama", "target_model": "llama", "recognition_score": 0.9304582568860572, "ground_truth": 1}, {"key": "36801665", "model": "llama", "target_model": "human", "recognition_score": 0.9339146152843588, "ground_truth": 0}, {"key": "36801665", "model": "llama", "target_model": "claude", "recognition_score": 0.9039745137160866, "ground_truth": 0}, {"key": "36801665", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9012274088632634, "ground_truth": 0}, {"key": "36801665", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9289263339325392, "ground_truth": 0}, {"key": "34954610", "model": "llama", "target_model": "llama", "recognition_score": 0.8198933304867091, "ground_truth": 1}, {"key": "34954610", "model": "llama", "target_model": "human", "recognition_score": 0.47463117221059326, "ground_truth": 0}, {"key": "34954610", "model": "llama", "target_model": "claude", "recognition_score": 0.7577943615945892, "ground_truth": 0}, {"key": "34954610", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5370414203439543, "ground_truth": 0}, {"key": "34954610", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8333245989192207, "ground_truth": 0}, {"key": "37020510", "model": "llama", "target_model": "llama", "recognition_score": 0.9489172670536311, "ground_truth": 1}, {"key": "37020510", "model": "llama", "target_model": "human", "recognition_score": 0.8679338451958574, "ground_truth": 0}, {"key": "37020510", "model": "llama", "target_model": "claude", "recognition_score": 0.9149009638228328, "ground_truth": 0}, {"key": "37020510", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9343951673614648, "ground_truth": 0}, {"key": "37020510", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9569571526957132, "ground_truth": 0}, {"key": "38064637", "model": "llama", "target_model": "llama", "recognition_score": 0.5755880103886034, "ground_truth": 1}, {"key": "38064637", "model": "llama", "target_model": "human", "recognition_score": 0.5583269828275567, "ground_truth": 0}, {"key": "38064637", "model": "llama", "target_model": "claude", "recognition_score": 0.26894141790774656, "ground_truth": 0}, {"key": "38064637", "model": "llama", "target_model": "gpt4", "recognition_score": 0.2942149604857648, "ground_truth": 0}, {"key": "38064637", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4590761150383059, "ground_truth": 0}, {"key": "40886108", "model": "llama", "target_model": "llama", "recognition_score": 0.9348724562269721, "ground_truth": 1}, {"key": "40886108", "model": "llama", "target_model": "human", "recognition_score": 0.9618217290304194, "ground_truth": 0}, {"key": "40886108", "model": "llama", "target_model": "claude", "recognition_score": 0.9678992934370302, "ground_truth": 0}, {"key": "40886108", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9724147188453847, "ground_truth": 0}, {"key": "40886108", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9681411454250898, "ground_truth": 0}, {"key": "38554603", "model": "llama", "target_model": "llama", "recognition_score": 0.8558511597964938, "ground_truth": 1}, {"key": "38554603", "model": "llama", "target_model": "human", "recognition_score": 0.7772998604408903, "ground_truth": 0}, {"key": "38554603", "model": "llama", "target_model": "claude", "recognition_score": 0.7520125748413117, "ground_truth": 0}, {"key": "38554603", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7799929120840406, "ground_truth": 0}, {"key": "38554603", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8887587996053783, "ground_truth": 0}, {"key": "39115586", "model": "llama", "target_model": "llama", "recognition_score": 0.6187804438570309, "ground_truth": 1}, {"key": "39115586", "model": "llama", "target_model": "human", "recognition_score": 0.7416740092963018, "ground_truth": 0}, {"key": "39115586", "model": "llama", "target_model": "claude", "recognition_score": 0.6477982233474023, "ground_truth": 0}, {"key": "39115586", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7356416460228443, "ground_truth": 0}, {"key": "39115586", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7008948204630306, "ground_truth": 0}, {"key": "38786314", "model": "llama", "target_model": "llama", "recognition_score": 0.883235981383633, "ground_truth": 1}, {"key": "38786314", "model": "llama", "target_model": "human", "recognition_score": 0.7826624982395134, "ground_truth": 0}, {"key": "38786314", "model": "llama", "target_model": "claude", "recognition_score": 0.8519528002679824, "ground_truth": 0}, {"key": "38786314", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8311430583065025, "ground_truth": 0}, {"key": "38786314", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8633916138894374, "ground_truth": 0}, {"key": "38721078", "model": "llama", "target_model": "llama", "recognition_score": 0.9441768551414126, "ground_truth": 1}, {"key": "38721078", "model": "llama", "target_model": "human", "recognition_score": 0.9623913649511235, "ground_truth": 0}, {"key": "38721078", "model": "llama", "target_model": "claude", "recognition_score": 0.9648551518015874, "ground_truth": 0}, {"key": "38721078", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9546474168811967, "ground_truth": 0}, {"key": "38721078", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9559813530955259, "ground_truth": 0}, {"key": "39475467", "model": "llama", "target_model": "llama", "recognition_score": 0.7866228230149606, "ground_truth": 1}, {"key": "39475467", "model": "llama", "target_model": "human", "recognition_score": 0.6297746073720392, "ground_truth": 0}, {"key": "39475467", "model": "llama", "target_model": "claude", "recognition_score": 0.9314625102061598, "ground_truth": 0}, {"key": "39475467", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8267117845590621, "ground_truth": 0}, {"key": "39475467", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7853085859347653, "ground_truth": 0}, {"key": "35691234", "model": "llama", "target_model": "llama", "recognition_score": 0.8529354643865169, "ground_truth": 1}, {"key": "35691234", "model": "llama", "target_model": "human", "recognition_score": 0.6039318374708066, "ground_truth": 0}, {"key": "35691234", "model": "llama", "target_model": "claude", "recognition_score": 0.6808786335433981, "ground_truth": 0}, {"key": "35691234", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6584174971495406, "ground_truth": 0}, {"key": "35691234", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6113819830622972, "ground_truth": 0}, {"key": "36871390", "model": "llama", "target_model": "llama", "recognition_score": 0.6584174907198421, "ground_truth": 1}, {"key": "36871390", "model": "llama", "target_model": "human", "recognition_score": 0.46490158710482327, "ground_truth": 0}, {"key": "36871390", "model": "llama", "target_model": "claude", "recognition_score": 0.8902942215405001, "ground_truth": 0}, {"key": "36871390", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7201715278733292, "ground_truth": 0}, {"key": "36871390", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8056321767391283, "ground_truth": 0}, {"key": "31730844", "model": "llama", "target_model": "llama", "recognition_score": 0.6113819413923237, "ground_truth": 1}, {"key": "31730844", "model": "llama", "target_model": "human", "recognition_score": 0.29421497574988015, "ground_truth": 0}, {"key": "31730844", "model": "llama", "target_model": "claude", "recognition_score": 0.4551986037571142, "ground_truth": 0}, {"key": "31730844", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5602526740177847, "ground_truth": 0}, {"key": "31730844", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5583269784419432, "ground_truth": 0}, {"key": "30810940", "model": "llama", "target_model": "llama", "recognition_score": 0.5907791950031003, "ground_truth": 1}, {"key": "30810940", "model": "llama", "target_model": "human", "recognition_score": 0.49804691317746314, "ground_truth": 0}, {"key": "30810940", "model": "llama", "target_model": "claude", "recognition_score": 0.6424324881353872, "ground_truth": 0}, {"key": "30810940", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7431680139780142, "ground_truth": 0}, {"key": "30810940", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6424324677172438, "ground_truth": 0}, {"key": "39352003", "model": "llama", "target_model": "llama", "recognition_score": 0.9511422221425588, "ground_truth": 1}, {"key": "39352003", "model": "llama", "target_model": "human", "recognition_score": 0.9462003535355512, "ground_truth": 0}, {"key": "39352003", "model": "llama", "target_model": "claude", "recognition_score": 0.9761291641096321, "ground_truth": 0}, {"key": "39352003", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9585377255374923, "ground_truth": 0}, {"key": "39352003", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9676556691899222, "ground_truth": 0}, {"key": "40118123", "model": "llama", "target_model": "llama", "recognition_score": 0.7138307498597924, "ground_truth": 1}, {"key": "40118123", "model": "llama", "target_model": "human", "recognition_score": 0.6976089323938652, "ground_truth": 0}, {"key": "40118123", "model": "llama", "target_model": "claude", "recognition_score": 0.5136684782080382, "ground_truth": 0}, {"key": "40118123", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5660185553817223, "ground_truth": 0}, {"key": "40118123", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6150878494600915, "ground_truth": 0}, {"key": "37114191", "model": "llama", "target_model": "llama", "recognition_score": 0.5851011742976068, "ground_truth": 1}, {"key": "37114191", "model": "llama", "target_model": "human", "recognition_score": 0.5312094044316699, "ground_truth": 0}, {"key": "37114191", "model": "llama", "target_model": "claude", "recognition_score": 0.8080672013812141, "ground_truth": 0}, {"key": "37114191", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6057990749015725, "ground_truth": 0}, {"key": "37114191", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6584175083475317, "ground_truth": 0}, {"key": "39268203", "model": "llama", "target_model": "llama", "recognition_score": 0.9429285980768182, "ground_truth": 1}, {"key": "39268203", "model": "llama", "target_model": "human", "recognition_score": 0.9066531185972032, "ground_truth": 0}, {"key": "39268203", "model": "llama", "target_model": "claude", "recognition_score": 0.8633916104779031, "ground_truth": 0}, {"key": "39268203", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8407825915148797, "ground_truth": 0}, {"key": "39268203", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8732148259491503, "ground_truth": 0}, {"key": "37950968", "model": "llama", "target_model": "llama", "recognition_score": 0.8044059197651968, "ground_truth": 1}, {"key": "37950968", "model": "llama", "target_model": "human", "recognition_score": 0.554470465404859, "ground_truth": 0}, {"key": "37950968", "model": "llama", "target_model": "claude", "recognition_score": 0.6513548649340001, "ground_truth": 0}, {"key": "37950968", "model": "llama", "target_model": "gpt4", "recognition_score": 0.695958327348763, "ground_truth": 0}, {"key": "37950968", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5926666118435718, "ground_truth": 0}, {"key": "34959807", "model": "llama", "target_model": "llama", "recognition_score": 0.8596637528240422, "ground_truth": 1}, {"key": "34959807", "model": "llama", "target_model": "human", "recognition_score": 0.7662936513334985, "ground_truth": 0}, {"key": "34959807", "model": "llama", "target_model": "claude", "recognition_score": 0.9005297759174348, "ground_truth": 0}, {"key": "34959807", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8587185976034392, "ground_truth": 0}, {"key": "34959807", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8670357506194674, "ground_truth": 0}, {"key": "35631314", "model": "llama", "target_model": "llama", "recognition_score": 0.9645892685738796, "ground_truth": 1}, {"key": "35631314", "model": "llama", "target_model": "human", "recognition_score": 0.9319595771607824, "ground_truth": 0}, {"key": "35631314", "model": "llama", "target_model": "claude", "recognition_score": 0.9656413110506044, "ground_truth": 0}, {"key": "35631314", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9612438038160257, "ground_truth": 0}, {"key": "35631314", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9572778032346683, "ground_truth": 0}, {"key": "38082365", "model": "llama", "target_model": "llama", "recognition_score": 0.9445872083318848, "ground_truth": 1}, {"key": "38082365", "model": "llama", "target_model": "human", "recognition_score": 0.9507778860443521, "ground_truth": 0}, {"key": "38082365", "model": "llama", "target_model": "claude", "recognition_score": 0.9235923164424428, "ground_truth": 0}, {"key": "38082365", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9629528256464148, "ground_truth": 0}, {"key": "38082365", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9367494738354187, "ground_truth": 0}, {"key": "37242829", "model": "llama", "target_model": "llama", "recognition_score": 0.6460136856998506, "ground_truth": 1}, {"key": "37242829", "model": "llama", "target_model": "human", "recognition_score": 0.7662936474738125, "ground_truth": 0}, {"key": "37242829", "model": "llama", "target_model": "claude", "recognition_score": 0.68930562519161, "ground_truth": 0}, {"key": "37242829", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5964331394349055, "ground_truth": 0}, {"key": "37242829", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5292633864917514, "ground_truth": 0}, {"key": "38556068", "model": "llama", "target_model": "llama", "recognition_score": 0.5156199357298074, "ground_truth": 1}, {"key": "38556068", "model": "llama", "target_model": "human", "recognition_score": 0.6601723496492377, "ground_truth": 0}, {"key": "38556068", "model": "llama", "target_model": "claude", "recognition_score": 0.7025300625224367, "ground_truth": 0}, {"key": "38556068", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7490872091370924, "ground_truth": 0}, {"key": "38556068", "model": "llama", "target_model": "gpt35", "recognition_score": 0.806852636057539, "ground_truth": 0}, {"key": "32969336", "model": "llama", "target_model": "llama", "recognition_score": 0.7931059472327211, "ground_truth": 1}, {"key": "32969336", "model": "llama", "target_model": "human", "recognition_score": 0.9086178903710157, "ground_truth": 0}, {"key": "32969336", "model": "llama", "target_model": "claude", "recognition_score": 0.7759445506779157, "ground_truth": 0}, {"key": "32969336", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7310585861553667, "ground_truth": 0}, {"key": "32969336", "model": "llama", "target_model": "gpt35", "recognition_score": 0.567936615015242, "ground_truth": 0}, {"key": "36825153", "model": "llama", "target_model": "llama", "recognition_score": 0.3998116448530887, "ground_truth": 1}, {"key": "36825153", "model": "llama", "target_model": "human", "recognition_score": 0.45326186074078584, "ground_truth": 0}, {"key": "36825153", "model": "llama", "target_model": "claude", "recognition_score": 0.5409238651655155, "ground_truth": 0}, {"key": "36825153", "model": "llama", "target_model": "gpt4", "recognition_score": 0.1285251376331023, "ground_truth": 0}, {"key": "36825153", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3757064662349693, "ground_truth": 0}, {"key": "41050146", "model": "llama", "target_model": "llama", "recognition_score": 0.9039745076978107, "ground_truth": 1}, {"key": "41050146", "model": "llama", "target_model": "human", "recognition_score": 0.9485372346738066, "ground_truth": 0}, {"key": "41050146", "model": "llama", "target_model": "claude", "recognition_score": 0.9039744997904643, "ground_truth": 0}, {"key": "41050146", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8031738006735737, "ground_truth": 0}, {"key": "41050146", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9553191277254569, "ground_truth": 0}, {"key": "27865037", "model": "llama", "target_model": "llama", "recognition_score": 0.5273165392038552, "ground_truth": 1}, {"key": "27865037", "model": "llama", "target_model": "human", "recognition_score": 0.2523840402440289, "ground_truth": 0}, {"key": "27865037", "model": "llama", "target_model": "claude", "recognition_score": 0.5234203469858791, "ground_truth": 0}, {"key": "27865037", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5945512455534373, "ground_truth": 0}, {"key": "27865037", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5660185352231638, "ground_truth": 0}, {"key": "39868565", "model": "llama", "target_model": "llama", "recognition_score": 0.8019358431098013, "ground_truth": 1}, {"key": "39868565", "model": "llama", "target_model": "human", "recognition_score": 0.7690802140467926, "ground_truth": 0}, {"key": "39868565", "model": "llama", "target_model": "claude", "recognition_score": 0.8459424488987961, "ground_truth": 0}, {"key": "39868565", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6976089521552892, "ground_truth": 0}, {"key": "39868565", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6909763072503998, "ground_truth": 0}, {"key": "37761968", "model": "llama", "target_model": "llama", "recognition_score": 0.8365545541050673, "ground_truth": 1}, {"key": "37761968", "model": "llama", "target_model": "human", "recognition_score": 0.830043768349966, "ground_truth": 0}, {"key": "37761968", "model": "llama", "target_model": "claude", "recognition_score": 0.7446563580233418, "ground_truth": 0}, {"key": "37761968", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7892336896233438, "ground_truth": 0}, {"key": "37761968", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7981867823696734, "ground_truth": 0}, {"key": "16326139", "model": "llama", "target_model": "llama", "recognition_score": 0.4726835009168923, "ground_truth": 1}, {"key": "16326139", "model": "llama", "target_model": "human", "recognition_score": 0.4263216166561388, "ground_truth": 0}, {"key": "16326139", "model": "llama", "target_model": "claude", "recognition_score": 0.36658974222171414, "ground_truth": 0}, {"key": "16326139", "model": "llama", "target_model": "gpt4", "recognition_score": 0.48242910131763506, "ground_truth": 0}, {"key": "16326139", "model": "llama", "target_model": "gpt35", "recognition_score": 0.22678363880579544, "ground_truth": 0}, {"key": "36568381", "model": "llama", "target_model": "llama", "recognition_score": 0.6808786253290939, "ground_truth": 1}, {"key": "36568381", "model": "llama", "target_model": "human", "recognition_score": 0.6893056228024129, "ground_truth": 0}, {"key": "36568381", "model": "llama", "target_model": "claude", "recognition_score": 0.8056321919477988, "ground_truth": 0}, {"key": "36568381", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8732148422883943, "ground_truth": 0}, {"key": "36568381", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7676898680232244, "ground_truth": 0}, {"key": "39855613", "model": "llama", "target_model": "llama", "recognition_score": 0.8895288353335756, "ground_truth": 1}, {"key": "39855613", "model": "llama", "target_model": "human", "recognition_score": 0.9079671351632912, "ground_truth": 0}, {"key": "39855613", "model": "llama", "target_model": "claude", "recognition_score": 0.9348724444892781, "ground_truth": 0}, {"key": "39855613", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8925625203413803, "ground_truth": 0}, {"key": "39855613", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9268352742643401, "ground_truth": 0}, {"key": "29856302", "model": "llama", "target_model": "llama", "recognition_score": 0.7279754651617402, "ground_truth": 1}, {"key": "29856302", "model": "llama", "target_model": "human", "recognition_score": 0.8386797499015058, "ground_truth": 0}, {"key": "29856302", "model": "llama", "target_model": "claude", "recognition_score": 0.6224593470571942, "ground_truth": 0}, {"key": "29856302", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7074047238190201, "ground_truth": 0}, {"key": "29856302", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6757646022976391, "ground_truth": 0}, {"key": "35641106", "model": "llama", "target_model": "llama", "recognition_score": 0.6943026724812328, "ground_truth": 1}, {"key": "35641106", "model": "llama", "target_model": "human", "recognition_score": 0.7106283071198705, "ground_truth": 0}, {"key": "35641106", "model": "llama", "target_model": "claude", "recognition_score": 0.7676898522681964, "ground_truth": 0}, {"key": "35641106", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7138307539691255, "ground_truth": 0}, {"key": "35641106", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7279754518961186, "ground_truth": 0}, {"key": "39474558", "model": "llama", "target_model": "llama", "recognition_score": 0.5331544000672017, "ground_truth": 1}, {"key": "39474558", "model": "llama", "target_model": "human", "recognition_score": 0.49023561031607893, "ground_truth": 0}, {"key": "39474558", "model": "llama", "target_model": "claude", "recognition_score": 0.5888891543797848, "ground_truth": 0}, {"key": "39474558", "model": "llama", "target_model": "gpt4", "recognition_score": 0.63341027517917, "ground_truth": 0}, {"key": "39474558", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8386797745614519, "ground_truth": 0}, {"key": "34338135", "model": "llama", "target_model": "llama", "recognition_score": 0.8705972625104753, "ground_truth": 1}, {"key": "34338135", "model": "llama", "target_model": "human", "recognition_score": 0.8255897153063585, "ground_truth": 0}, {"key": "34338135", "model": "llama", "target_model": "claude", "recognition_score": 0.9367494800452091, "ground_truth": 0}, {"key": "34338135", "model": "llama", "target_model": "gpt4", "recognition_score": 0.878314237318646, "ground_truth": 0}, {"key": "34338135", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9167080732621993, "ground_truth": 0}, {"key": "35870330", "model": "llama", "target_model": "llama", "recognition_score": 0.8856314839645681, "ground_truth": 1}, {"key": "35870330", "model": "llama", "target_model": "human", "recognition_score": 0.8469578580218875, "ground_truth": 0}, {"key": "35870330", "model": "llama", "target_model": "claude", "recognition_score": 0.8499711870446651, "ground_truth": 0}, {"key": "35870330", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9178933690225651, "ground_truth": 0}, {"key": "35870330", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8044059142766492, "ground_truth": 0}, {"key": "24478245", "model": "llama", "target_model": "llama", "recognition_score": 0.9263037318679268, "ground_truth": 1}, {"key": "24478245", "model": "llama", "target_model": "human", "recognition_score": 0.8879840535015904, "ground_truth": 0}, {"key": "24478245", "model": "llama", "target_model": "claude", "recognition_score": 0.9507778883976487, "ground_truth": 0}, {"key": "24478245", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9407897401563692, "ground_truth": 0}, {"key": "24478245", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9645892651920711, "ground_truth": 0}, {"key": "38485946", "model": "llama", "target_model": "llama", "recognition_score": 0.8783142472236113, "ground_truth": 1}, {"key": "38485946", "model": "llama", "target_model": "human", "recognition_score": 0.5292633984063049, "ground_truth": 0}, {"key": "38485946", "model": "llama", "target_model": "claude", "recognition_score": 0.6859494618970979, "ground_truth": 0}, {"key": "38485946", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9012274112676182, "ground_truth": 0}, {"key": "38485946", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8479677528489449, "ground_truth": 0}, {"key": "32509613", "model": "llama", "target_model": "llama", "recognition_score": 0.9149009432372938, "ground_truth": 1}, {"key": "32509613", "model": "llama", "target_model": "human", "recognition_score": 0.9469902334160181, "ground_truth": 0}, {"key": "32509613", "model": "llama", "target_model": "claude", "recognition_score": 0.8783142400223057, "ground_truth": 0}, {"key": "32509613", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8783142461766472, "ground_truth": 0}, {"key": "32509613", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9376689580597822, "ground_truth": 0}, {"key": "34078819", "model": "llama", "target_model": "llama", "recognition_score": 0.8723473819648127, "ground_truth": 1}, {"key": "34078819", "model": "llama", "target_model": "human", "recognition_score": 0.6477982080849275, "ground_truth": 0}, {"key": "34078819", "model": "llama", "target_model": "claude", "recognition_score": 0.9445872107165566, "ground_truth": 0}, {"key": "34078819", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8210441064340511, "ground_truth": 0}, {"key": "34078819", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9289263318669009, "ground_truth": 0}, {"key": "39523865", "model": "llama", "target_model": "llama", "recognition_score": 0.7813306055345113, "ground_truth": 1}, {"key": "39523865", "model": "llama", "target_model": "human", "recognition_score": 0.7620701184534727, "ground_truth": 0}, {"key": "39523865", "model": "llama", "target_model": "claude", "recognition_score": 0.7931059547028423, "ground_truth": 0}, {"key": "39523865", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5926665893509757, "ground_truth": 0}, {"key": "39523865", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8068526226201292, "ground_truth": 0}, {"key": "33146158", "model": "llama", "target_model": "llama", "recognition_score": 0.8615382100307271, "ground_truth": 1}, {"key": "33146158", "model": "llama", "target_model": "human", "recognition_score": 0.8311430344406168, "ground_truth": 0}, {"key": "33146158", "model": "llama", "target_model": "claude", "recognition_score": 0.8233283875957116, "ground_truth": 0}, {"key": "33146158", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8376199597587067, "ground_truth": 0}, {"key": "33146158", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7606506547689206, "ground_truth": 0}, {"key": "32083974", "model": "llama", "target_model": "llama", "recognition_score": 0.7826624743721197, "ground_truth": 1}, {"key": "32083974", "model": "llama", "target_model": "human", "recognition_score": 0.42250464289026934, "ground_truth": 0}, {"key": "32083974", "model": "llama", "target_model": "claude", "recognition_score": 0.9669140220838233, "ground_truth": 0}, {"key": "32083974", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5851011454802677, "ground_truth": 0}, {"key": "32083974", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8397339717452191, "ground_truth": 0}, {"key": "34378482", "model": "llama", "target_model": "llama", "recognition_score": 0.9543079712980207, "ground_truth": 1}, {"key": "34378482", "model": "llama", "target_model": "human", "recognition_score": 0.9742394397996811, "ground_truth": 0}, {"key": "34378482", "model": "llama", "target_model": "claude", "recognition_score": 0.973443426104543, "ground_truth": 0}, {"key": "34378482", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9334308082141533, "ground_truth": 0}, {"key": "34378482", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9492946370704979, "ground_truth": 0}, {"key": "38080102", "model": "llama", "target_model": "llama", "recognition_score": 0.592666620036949, "ground_truth": 1}, {"key": "38080102", "model": "llama", "target_model": "human", "recognition_score": 0.7981867890957093, "ground_truth": 0}, {"key": "38080102", "model": "llama", "target_model": "claude", "recognition_score": 0.7185943961743008, "ground_truth": 0}, {"key": "38080102", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7025300634921794, "ground_truth": 0}, {"key": "38080102", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6352224214525005, "ground_truth": 0}, {"key": "40244537", "model": "llama", "target_model": "llama", "recognition_score": 0.8749346180691698, "ground_truth": 1}, {"key": "40244537", "model": "llama", "target_model": "human", "recognition_score": 0.8080672023207263, "ground_truth": 0}, {"key": "40244537", "model": "llama", "target_model": "claude", "recognition_score": 0.8606036204046295, "ground_truth": 0}, {"key": "40244537", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7718434970591745, "ground_truth": 0}, {"key": "40244537", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7201715232468975, "ground_truth": 0}, {"key": "33497789", "model": "llama", "target_model": "llama", "recognition_score": 0.8969755664422969, "ground_truth": 1}, {"key": "33497789", "model": "llama", "target_model": "human", "recognition_score": 0.9559813480243465, "ground_truth": 0}, {"key": "33497789", "model": "llama", "target_model": "claude", "recognition_score": 0.9012274090630953, "ground_truth": 0}, {"key": "33497789", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8910549498290025, "ground_truth": 0}, {"key": "33497789", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9066531186906919, "ground_truth": 0}, {"key": "28816889", "model": "llama", "target_model": "llama", "recognition_score": 0.9372107905163939, "ground_truth": 1}, {"key": "28816889", "model": "llama", "target_model": "human", "recognition_score": 0.9425067174129248, "ground_truth": 0}, {"key": "28816889", "model": "llama", "target_model": "claude", "recognition_score": 0.9005297974044336, "ground_truth": 0}, {"key": "28816889", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9167080911240929, "ground_truth": 0}, {"key": "28816889", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9257686290996843, "ground_truth": 0}, {"key": "38157127", "model": "llama", "target_model": "llama", "recognition_score": 0.40168782983093604, "ground_truth": 1}, {"key": "38157127", "model": "llama", "target_model": "human", "recognition_score": 0.48633150943165265, "ground_truth": 0}, {"key": "38157127", "model": "llama", "target_model": "claude", "recognition_score": 0.08756384641805191, "ground_truth": 0}, {"key": "38157127", "model": "llama", "target_model": "gpt4", "recognition_score": 0.1824255417714771, "ground_truth": 0}, {"key": "38157127", "model": "llama", "target_model": "gpt35", "recognition_score": 0.25386101132375843, "ground_truth": 0}, {"key": "36183569", "model": "llama", "target_model": "llama", "recognition_score": 0.3007455896219375, "ground_truth": 1}, {"key": "36183569", "model": "llama", "target_model": "human", "recognition_score": 0.5926665955886902, "ground_truth": 0}, {"key": "36183569", "model": "llama", "target_model": "claude", "recognition_score": 0.6001883507072525, "ground_truth": 0}, {"key": "36183569", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4282333912239645, "ground_truth": 0}, {"key": "36183569", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "36012016", "model": "llama", "target_model": "llama", "recognition_score": 0.7476159682256939, "ground_truth": 1}, {"key": "36012016", "model": "llama", "target_model": "human", "recognition_score": 0.8705972639912556, "ground_truth": 0}, {"key": "36012016", "model": "llama", "target_model": "claude", "recognition_score": 0.8418256590003796, "ground_truth": 0}, {"key": "36012016", "model": "llama", "target_model": "gpt4", "recognition_score": 0.791821063296351, "ground_truth": 0}, {"key": "36012016", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6352224363046407, "ground_truth": 0}, {"key": "34571973", "model": "llama", "target_model": "llama", "recognition_score": 0.7386690784812471, "ground_truth": 1}, {"key": "34571973", "model": "llama", "target_model": "human", "recognition_score": 0.7341195055184797, "ground_truth": 0}, {"key": "34571973", "model": "llama", "target_model": "claude", "recognition_score": 0.8469578375036104, "ground_truth": 0}, {"key": "34571973", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7264256162260256, "ground_truth": 0}, {"key": "34571973", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7994423186939971, "ground_truth": 0}, {"key": "38707498", "model": "llama", "target_model": "llama", "recognition_score": 0.8688267709205495, "ground_truth": 1}, {"key": "38707498", "model": "llama", "target_model": "human", "recognition_score": 0.7931059539919797, "ground_truth": 0}, {"key": "38707498", "model": "llama", "target_model": "claude", "recognition_score": 0.787931189765962, "ground_truth": 0}, {"key": "38707498", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8092759861857131, "ground_truth": 0}, {"key": "38707498", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8311430442459586, "ground_truth": 0}, {"key": "35459082", "model": "llama", "target_model": "llama", "recognition_score": 0.9829546850613897, "ground_truth": 1}, {"key": "35459082", "model": "llama", "target_model": "human", "recognition_score": 0.9869795104426358, "ground_truth": 0}, {"key": "35459082", "model": "llama", "target_model": "claude", "recognition_score": 0.9700134942759734, "ground_truth": 0}, {"key": "35459082", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9880389005993918, "ground_truth": 0}, {"key": "35459082", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9629528325097615, "ground_truth": 0}, {"key": "39464041", "model": "llama", "target_model": "llama", "recognition_score": 0.9744347887868545, "ground_truth": 1}, {"key": "39464041", "model": "llama", "target_model": "human", "recognition_score": 0.9394706109761164, "ground_truth": 0}, {"key": "39464041", "model": "llama", "target_model": "claude", "recognition_score": 0.9719924780951803, "ground_truth": 0}, {"key": "39464041", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9606574960213513, "ground_truth": 0}, {"key": "39464041", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9702399069462346, "ground_truth": 0}, {"key": "23782052", "model": "llama", "target_model": "llama", "recognition_score": 0.5467381363367306, "ground_truth": 1}, {"key": "23782052", "model": "llama", "target_model": "human", "recognition_score": 0.8116760149627044, "ground_truth": 0}, {"key": "23782052", "model": "llama", "target_model": "claude", "recognition_score": 0.6531269282407824, "ground_truth": 0}, {"key": "23782052", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6352224458245607, "ground_truth": 0}, {"key": "23782052", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8791467731218592, "ground_truth": 0}, {"key": "36568455", "model": "llama", "target_model": "llama", "recognition_score": 0.8895288499901526, "ground_truth": 1}, {"key": "36568455", "model": "llama", "target_model": "human", "recognition_score": 0.9207896695402806, "ground_truth": 0}, {"key": "36568455", "model": "llama", "target_model": "claude", "recognition_score": 0.9597620605412052, "ground_truth": 0}, {"key": "36568455", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9629528294430124, "ground_truth": 0}, {"key": "36568455", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9339146187494599, "ground_truth": 0}, {"key": "38469552", "model": "llama", "target_model": "llama", "recognition_score": 0.9445872098370939, "ground_truth": 1}, {"key": "38469552", "model": "llama", "target_model": "human", "recognition_score": 0.8714748561704864, "ground_truth": 0}, {"key": "38469552", "model": "llama", "target_model": "claude", "recognition_score": 0.9219218362074424, "ground_truth": 0}, {"key": "38469552", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9606574936345664, "ground_truth": 0}, {"key": "38469552", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9324533078661235, "ground_truth": 0}, {"key": "35922277", "model": "llama", "target_model": "llama", "recognition_score": 0.9635062333003386, "ground_truth": 1}, {"key": "35922277", "model": "llama", "target_model": "human", "recognition_score": 0.9489172712436053, "ground_truth": 0}, {"key": "35922277", "model": "llama", "target_model": "claude", "recognition_score": 0.9433475711978699, "ground_truth": 0}, {"key": "35922277", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8947894578233163, "ground_truth": 0}, {"key": "35922277", "model": "llama", "target_model": "gpt35", "recognition_score": 0.95221993517733, "ground_truth": 0}, {"key": "32744293", "model": "llama", "target_model": "llama", "recognition_score": 0.8386797564707353, "ground_truth": 1}, {"key": "32744293", "model": "llama", "target_model": "human", "recognition_score": 0.8164063760028245, "ground_truth": 0}, {"key": "32744293", "model": "llama", "target_model": "claude", "recognition_score": 0.921921839728269, "ground_truth": 0}, {"key": "32744293", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7931059542632047, "ground_truth": 0}, {"key": "32744293", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7969253882048773, "ground_truth": 0}, {"key": "30972362", "model": "llama", "target_model": "llama", "recognition_score": 0.9394706084948328, "ground_truth": 1}, {"key": "30972362", "model": "llama", "target_model": "human", "recognition_score": 0.9669140240625003, "ground_truth": 0}, {"key": "30972362", "model": "llama", "target_model": "claude", "recognition_score": 0.9835969665171808, "ground_truth": 0}, {"key": "30972362", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9676556709459596, "ground_truth": 0}, {"key": "30972362", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9632305366411896, "ground_truth": 0}, {"key": "36380943", "model": "llama", "target_model": "llama", "recognition_score": 0.8688267750917081, "ground_truth": 1}, {"key": "36380943", "model": "llama", "target_model": "human", "recognition_score": 0.8807970733059866, "ground_truth": 0}, {"key": "36380943", "model": "llama", "target_model": "claude", "recognition_score": 0.8624675304397432, "ground_truth": 0}, {"key": "36380943", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8643104542474457, "ground_truth": 0}, {"key": "36380943", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8006920032886127, "ground_truth": 0}, {"key": "36929355", "model": "llama", "target_model": "llama", "recognition_score": 0.82671179450179, "ground_truth": 1}, {"key": "36929355", "model": "llama", "target_model": "human", "recognition_score": 0.7279754520718276, "ground_truth": 0}, {"key": "36929355", "model": "llama", "target_model": "claude", "recognition_score": 0.8407825936997573, "ground_truth": 0}, {"key": "36929355", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7185943713305679, "ground_truth": 0}, {"key": "36929355", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7264255920437517, "ground_truth": 0}, {"key": "39127206", "model": "llama", "target_model": "llama", "recognition_score": 0.8652240797450758, "ground_truth": 1}, {"key": "39127206", "model": "llama", "target_model": "human", "recognition_score": 0.256831988911607, "ground_truth": 0}, {"key": "39127206", "model": "llama", "target_model": "claude", "recognition_score": 0.6723317290369254, "ground_truth": 0}, {"key": "39127206", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8697145699563037, "ground_truth": 0}, {"key": "39127206", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7025300541302278, "ground_truth": 0}, {"key": "36128318", "model": "llama", "target_model": "llama", "recognition_score": 0.14414886112835928, "ground_truth": 1}, {"key": "36128318", "model": "llama", "target_model": "human", "recognition_score": 0.24653335522317457, "ground_truth": 0}, {"key": "36128318", "model": "llama", "target_model": "claude", "recognition_score": 0.19682620592470668, "ground_truth": 0}, {"key": "36128318", "model": "llama", "target_model": "gpt4", "recognition_score": 0.19314737639384824, "ground_truth": 0}, {"key": "36128318", "model": "llama", "target_model": "gpt35", "recognition_score": 0.1801066712259268, "ground_truth": 0}, {"key": "39863480", "model": "llama", "target_model": "llama", "recognition_score": 0.8824278702736905, "ground_truth": 1}, {"key": "39863480", "model": "llama", "target_model": "human", "recognition_score": 0.9213576211946246, "ground_truth": 0}, {"key": "39863480", "model": "llama", "target_model": "claude", "recognition_score": 0.9263037246494311, "ground_truth": 0}, {"key": "39863480", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8479677640097205, "ground_truth": 0}, {"key": "39863480", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9246876921043936, "ground_truth": 0}, {"key": "38634057", "model": "llama", "target_model": "llama", "recognition_score": 0.8723473775082297, "ground_truth": 1}, {"key": "38634057", "model": "llama", "target_model": "human", "recognition_score": 0.8705972655654824, "ground_truth": 0}, {"key": "38634057", "model": "llama", "target_model": "claude", "recognition_score": 0.9246876952764423, "ground_truth": 0}, {"key": "38634057", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7879311850501538, "ground_truth": 0}, {"key": "38634057", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7853085866241803, "ground_truth": 0}, {"key": "33131935", "model": "llama", "target_model": "llama", "recognition_score": 0.9219218306087472, "ground_truth": 1}, {"key": "33131935", "model": "llama", "target_model": "human", "recognition_score": 0.9348724504448352, "ground_truth": 0}, {"key": "33131935", "model": "llama", "target_model": "claude", "recognition_score": 0.9353465129048758, "ground_truth": 0}, {"key": "33131935", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9219218326094117, "ground_truth": 0}, {"key": "33131935", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9556514213587717, "ground_truth": 0}, {"key": "39021319", "model": "llama", "target_model": "llama", "recognition_score": 0.8152325078768586, "ground_truth": 1}, {"key": "39021319", "model": "llama", "target_model": "human", "recognition_score": 0.7248702524104926, "ground_truth": 0}, {"key": "39021319", "model": "llama", "target_model": "claude", "recognition_score": 0.7264255985387987, "ground_truth": 0}, {"key": "39021319", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8969755670890758, "ground_truth": 0}, {"key": "39021319", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8068526193636814, "ground_truth": 0}, {"key": "40644571", "model": "llama", "target_model": "llama", "recognition_score": 0.7520125963880346, "ground_truth": 1}, {"key": "40644571", "model": "llama", "target_model": "human", "recognition_score": 0.6976089296675196, "ground_truth": 0}, {"key": "40644571", "model": "llama", "target_model": "claude", "recognition_score": 0.7490872159895009, "ground_truth": 0}, {"key": "40644571", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6224593325616926, "ground_truth": 0}, {"key": "40644571", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7648916112432279, "ground_truth": 0}, {"key": "14681877", "model": "llama", "target_model": "llama", "recognition_score": 0.9666631784964648, "ground_truth": 1}, {"key": "14681877", "model": "llama", "target_model": "human", "recognition_score": 0.970464659240266, "ground_truth": 0}, {"key": "14681877", "model": "llama", "target_model": "claude", "recognition_score": 0.9477691382946627, "ground_truth": 0}, {"key": "14681877", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9777138163070054, "ground_truth": 0}, {"key": "14681877", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8902942316725584, "ground_truth": 0}, {"key": "36570890", "model": "llama", "target_model": "llama", "recognition_score": 0.9012274058400852, "ground_truth": 1}, {"key": "36570890", "model": "llama", "target_model": "human", "recognition_score": 0.7057850353418518, "ground_truth": 0}, {"key": "36570890", "model": "llama", "target_model": "claude", "recognition_score": 0.8376199620166206, "ground_truth": 0}, {"key": "36570890", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8587185896491311, "ground_truth": 0}, {"key": "36570890", "model": "llama", "target_model": "gpt35", "recognition_score": 0.778649314157787, "ground_truth": 0}, {"key": "30452755", "model": "llama", "target_model": "llama", "recognition_score": 0.9473810471188644, "ground_truth": 1}, {"key": "30452755", "model": "llama", "target_model": "human", "recognition_score": 0.9437636598799153, "ground_truth": 0}, {"key": "30452755", "model": "llama", "target_model": "claude", "recognition_score": 0.8879840410138866, "ground_truth": 0}, {"key": "30452755", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9381240160635467, "ground_truth": 0}, {"key": "30452755", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7826624792483741, "ground_truth": 0}, {"key": "37347053", "model": "llama", "target_model": "llama", "recognition_score": 0.7772998749949332, "ground_truth": 1}, {"key": "37347053", "model": "llama", "target_model": "human", "recognition_score": 0.8244619444971099, "ground_truth": 0}, {"key": "37347053", "model": "llama", "target_model": "claude", "recognition_score": 0.7310585654288191, "ground_truth": 0}, {"key": "37347053", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7431680104974234, "ground_truth": 0}, {"key": "37347053", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7879311893533358, "ground_truth": 0}, {"key": "38890979", "model": "llama", "target_model": "llama", "recognition_score": 0.7879312102574044, "ground_truth": 1}, {"key": "38890979", "model": "llama", "target_model": "human", "recognition_score": 0.8289388037950087, "ground_truth": 0}, {"key": "38890979", "model": "llama", "target_model": "claude", "recognition_score": 0.7185943879233359, "ground_truth": 0}, {"key": "38890979", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6808785990878577, "ground_truth": 0}, {"key": "38890979", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7476159447086573, "ground_truth": 0}, {"key": "32974694", "model": "llama", "target_model": "llama", "recognition_score": 0.7620701302878021, "ground_truth": 1}, {"key": "32974694", "model": "llama", "target_model": "human", "recognition_score": 0.9640516761040665, "ground_truth": 0}, {"key": "32974694", "model": "llama", "target_model": "claude", "recognition_score": 0.7534666788763157, "ground_truth": 0}, {"key": "32974694", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8386797582044005, "ground_truth": 0}, {"key": "32974694", "model": "llama", "target_model": "gpt35", "recognition_score": 0.907312218690554, "ground_truth": 0}, {"key": "38519940", "model": "llama", "target_model": "llama", "recognition_score": 0.9449947113891004, "ground_truth": 1}, {"key": "38519940", "model": "llama", "target_model": "human", "recognition_score": 0.8539127508910711, "ground_truth": 0}, {"key": "38519940", "model": "llama", "target_model": "claude", "recognition_score": 0.9437636496753341, "ground_truth": 0}, {"key": "38519940", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9433475757402628, "ground_truth": 0}, {"key": "38519940", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9556514219911616, "ground_truth": 0}, {"key": "38870104", "model": "llama", "target_model": "llama", "recognition_score": 0.8856314604166459, "ground_truth": 1}, {"key": "38870104", "model": "llama", "target_model": "human", "recognition_score": 0.8221891419761478, "ground_truth": 0}, {"key": "38870104", "model": "llama", "target_model": "claude", "recognition_score": 0.9111797064168241, "ground_truth": 0}, {"key": "38870104", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8940517105360491, "ground_truth": 0}, {"key": "38870104", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9412234429576521, "ground_truth": 0}, {"key": "34283161", "model": "llama", "target_model": "llama", "recognition_score": 0.6001883492724468, "ground_truth": 1}, {"key": "34283161", "model": "llama", "target_model": "human", "recognition_score": 0.8006919826711584, "ground_truth": 0}, {"key": "34283161", "model": "llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "34283161", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7279754496185777, "ground_truth": 0}, {"key": "34283161", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8289388065173312, "ground_truth": 0}, {"key": "31650463", "model": "llama", "target_model": "llama", "recognition_score": 0.8807970725629559, "ground_truth": 1}, {"key": "31650463", "model": "llama", "target_model": "human", "recognition_score": 0.9273632967426526, "ground_truth": 0}, {"key": "31650463", "model": "llama", "target_model": "claude", "recognition_score": 0.9403530580424383, "ground_truth": 0}, {"key": "31650463", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7918210620227069, "ground_truth": 0}, {"key": "31650463", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8333245974593003, "ground_truth": 0}, {"key": "35589432", "model": "llama", "target_model": "llama", "recognition_score": 0.8783142442820382, "ground_truth": 1}, {"key": "35589432", "model": "llama", "target_model": "human", "recognition_score": 0.8068526083212388, "ground_truth": 0}, {"key": "35589432", "model": "llama", "target_model": "claude", "recognition_score": 0.8679338425073098, "ground_truth": 0}, {"key": "35589432", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8428631498068339, "ground_truth": 0}, {"key": "35589432", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7310585873579294, "ground_truth": 0}, {"key": "14412752", "model": "llama", "target_model": "llama", "recognition_score": 0.87059726653762, "ground_truth": 1}, {"key": "14412752", "model": "llama", "target_model": "human", "recognition_score": 0.869714579751001, "ground_truth": 0}, {"key": "14412752", "model": "llama", "target_model": "claude", "recognition_score": 0.7676898616664981, "ground_truth": 0}, {"key": "14412752", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8529354830124438, "ground_truth": 0}, {"key": "14412752", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8031738099970458, "ground_truth": 0}, {"key": "37271183", "model": "llama", "target_model": "llama", "recognition_score": 0.9824231151026344, "ground_truth": 1}, {"key": "37271183", "model": "llama", "target_model": "human", "recognition_score": 0.9817357207907024, "ground_truth": 0}, {"key": "37271183", "model": "llama", "target_model": "claude", "recognition_score": 0.9815951085191806, "ground_truth": 0}, {"key": "37271183", "model": "llama", "target_model": "gpt4", "recognition_score": 0.985042914235099, "ground_truth": 0}, {"key": "37271183", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9890976268107208, "ground_truth": 0}, {"key": "35588153", "model": "llama", "target_model": "llama", "recognition_score": 0.9522199312388889, "ground_truth": 1}, {"key": "35588153", "model": "llama", "target_model": "human", "recognition_score": 0.9814534363623482, "ground_truth": 0}, {"key": "35588153", "model": "llama", "target_model": "claude", "recognition_score": 0.9713473285573448, "ground_truth": 0}, {"key": "35588153", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9496693663857825, "ground_truth": 0}, {"key": "35588153", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9343951722917401, "ground_truth": 0}, {"key": "39876692", "model": "llama", "target_model": "llama", "recognition_score": 0.9462003488077567, "ground_truth": 1}, {"key": "39876692", "model": "llama", "target_model": "human", "recognition_score": 0.878314246109357, "ground_truth": 0}, {"key": "39876692", "model": "llama", "target_model": "claude", "recognition_score": 0.8697145898434077, "ground_truth": 0}, {"key": "39876692", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8848377734093675, "ground_truth": 0}, {"key": "39876692", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8529354760156257, "ground_truth": 0}, {"key": "38992323", "model": "llama", "target_model": "llama", "recognition_score": 0.8991213687129902, "ground_truth": 1}, {"key": "38992323", "model": "llama", "target_model": "human", "recognition_score": 0.898410547854201, "ground_truth": 0}, {"key": "38992323", "model": "llama", "target_model": "claude", "recognition_score": 0.9178933755175326, "ground_truth": 0}, {"key": "38992323", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7690802545646843, "ground_truth": 0}, {"key": "38992323", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8140528024820366, "ground_truth": 0}, {"key": "37556002", "model": "llama", "target_model": "llama", "recognition_score": 0.7592254018107627, "ground_truth": 1}, {"key": "37556002", "model": "llama", "target_model": "human", "recognition_score": 0.7295197706845077, "ground_truth": 0}, {"key": "37556002", "model": "llama", "target_model": "claude", "recognition_score": 0.8783142585896813, "ground_truth": 0}, {"key": "37556002", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9167080687552577, "ground_truth": 0}, {"key": "37556002", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8864204085117313, "ground_truth": 0}, {"key": "39875801", "model": "llama", "target_model": "llama", "recognition_score": 0.8519528049186962, "ground_truth": 1}, {"key": "39875801", "model": "llama", "target_model": "human", "recognition_score": 0.8832359876251711, "ground_truth": 0}, {"key": "39875801", "model": "llama", "target_model": "claude", "recognition_score": 0.920789677479162, "ground_truth": 0}, {"key": "39875801", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9458012699658228, "ground_truth": 0}, {"key": "39875801", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9348724519256387, "ground_truth": 0}, {"key": "39272285", "model": "llama", "target_model": "llama", "recognition_score": 0.3293917371640167, "ground_truth": 1}, {"key": "39272285", "model": "llama", "target_model": "human", "recognition_score": 0.2553436580779644, "ground_truth": 0}, {"key": "39272285", "model": "llama", "target_model": "claude", "recognition_score": 0.3775406822935367, "ground_truth": 0}, {"key": "39272285", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4397473408181851, "ground_truth": 0}, {"key": "39272285", "model": "llama", "target_model": "gpt35", "recognition_score": 0.33285232143939797, "ground_truth": 0}, {"key": "39629714", "model": "llama", "target_model": "llama", "recognition_score": 0.8489721918447612, "ground_truth": 1}, {"key": "39629714", "model": "llama", "target_model": "human", "recognition_score": 0.8615382022982432, "ground_truth": 0}, {"key": "39629714", "model": "llama", "target_model": "claude", "recognition_score": 0.6842640212636948, "ground_truth": 0}, {"key": "39629714", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9155072467391124, "ground_truth": 0}, {"key": "39629714", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6406358697978426, "ground_truth": 0}, {"key": "34043257", "model": "llama", "target_model": "llama", "recognition_score": 0.882427871293106, "ground_truth": 1}, {"key": "34043257", "model": "llama", "target_model": "human", "recognition_score": 0.8311430368205689, "ground_truth": 0}, {"key": "34043257", "model": "llama", "target_model": "claude", "recognition_score": 0.913676531127978, "ground_truth": 0}, {"key": "34043257", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9294404134661712, "ground_truth": 0}, {"key": "34043257", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8333245877684836, "ground_truth": 0}, {"key": "33995240", "model": "llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 1}, {"key": "33995240", "model": "llama", "target_model": "human", "recognition_score": 0.7745833951032391, "ground_truth": 0}, {"key": "33995240", "model": "llama", "target_model": "claude", "recognition_score": 0.8322366589444486, "ground_truth": 0}, {"key": "33995240", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4746311486535588, "ground_truth": 0}, {"key": "33995240", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6825737121921868, "ground_truth": 0}, {"key": "39399948", "model": "llama", "target_model": "llama", "recognition_score": 0.9640516764614747, "ground_truth": 1}, {"key": "39399948", "model": "llama", "target_model": "human", "recognition_score": 0.8723473841115793, "ground_truth": 0}, {"key": "39399948", "model": "llama", "target_model": "claude", "recognition_score": 0.9118099574049479, "ground_truth": 0}, {"key": "39399948", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9441768582970087, "ground_truth": 0}, {"key": "39399948", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8902942237950029, "ground_truth": 0}, {"key": "33185890", "model": "llama", "target_model": "llama", "recognition_score": 0.8816148951563836, "ground_truth": 1}, {"key": "33185890", "model": "llama", "target_model": "human", "recognition_score": 0.7592254224974441, "ground_truth": 0}, {"key": "33185890", "model": "llama", "target_model": "claude", "recognition_score": 0.8558511442326551, "ground_truth": 0}, {"key": "33185890", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8244619188249365, "ground_truth": 0}, {"key": "33185890", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8697145873014455, "ground_truth": 0}, {"key": "35280425", "model": "llama", "target_model": "llama", "recognition_score": 0.9385759587616634, "ground_truth": 1}, {"key": "35280425", "model": "llama", "target_model": "human", "recognition_score": 0.8539127561845652, "ground_truth": 0}, {"key": "35280425", "model": "llama", "target_model": "claude", "recognition_score": 0.8872045981404825, "ground_truth": 0}, {"key": "35280425", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9569571473461539, "ground_truth": 0}, {"key": "35280425", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9367494797427438, "ground_truth": 0}, {"key": "16365170", "model": "llama", "target_model": "llama", "recognition_score": 0.9390248163723153, "ground_truth": 1}, {"key": "16365170", "model": "llama", "target_model": "human", "recognition_score": 0.9529258222975373, "ground_truth": 0}, {"key": "16365170", "model": "llama", "target_model": "claude", "recognition_score": 0.9492946381478263, "ground_truth": 0}, {"key": "16365170", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8947894532024254, "ground_truth": 0}, {"key": "16365170", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9372107915318676, "ground_truth": 0}, {"key": "24388238", "model": "llama", "target_model": "llama", "recognition_score": 0.6893056036458657, "ground_truth": 1}, {"key": "24388238", "model": "llama", "target_model": "human", "recognition_score": 0.8233283968522266, "ground_truth": 0}, {"key": "24388238", "model": "llama", "target_model": "claude", "recognition_score": 0.7943849554789523, "ground_truth": 0}, {"key": "24388238", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8864204040533803, "ground_truth": 0}, {"key": "24388238", "model": "llama", "target_model": "gpt35", "recognition_score": 0.793105957173385, "ground_truth": 0}, {"key": "35024827", "model": "llama", "target_model": "llama", "recognition_score": 0.8529354800900713, "ground_truth": 1}, {"key": "35024827", "model": "llama", "target_model": "human", "recognition_score": 0.6859494597019573, "ground_truth": 0}, {"key": "35024827", "model": "llama", "target_model": "claude", "recognition_score": 0.8449215405962094, "ground_truth": 0}, {"key": "35024827", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7799929042131759, "ground_truth": 0}, {"key": "35024827", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6876300021855826, "ground_truth": 0}, {"key": "38624944", "model": "llama", "target_model": "llama", "recognition_score": 0.842863153809644, "ground_truth": 1}, {"key": "38624944", "model": "llama", "target_model": "human", "recognition_score": 0.9453993922860469, "ground_truth": 0}, {"key": "38624944", "model": "llama", "target_model": "claude", "recognition_score": 0.7918210605381928, "ground_truth": 0}, {"key": "38624944", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9268352739119757, "ground_truth": 0}, {"key": "38624944", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8955226679192319, "ground_truth": 0}, {"key": "34719830", "model": "llama", "target_model": "llama", "recognition_score": 0.8679338517504228, "ground_truth": 1}, {"key": "34719830", "model": "llama", "target_model": "human", "recognition_score": 0.9778834117629337, "ground_truth": 0}, {"key": "34719830", "model": "llama", "target_model": "claude", "recognition_score": 0.9612438041435353, "ground_truth": 0}, {"key": "34719830", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9485372288971223, "ground_truth": 0}, {"key": "34719830", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8679338396194037, "ground_truth": 0}, {"key": "38995225", "model": "llama", "target_model": "llama", "recognition_score": 0.3433417238302667, "ground_truth": 1}, {"key": "38995225", "model": "llama", "target_model": "human", "recognition_score": 0.6531268820823335, "ground_truth": 0}, {"key": "38995225", "model": "llama", "target_model": "claude", "recognition_score": 0.5273165487203425, "ground_truth": 0}, {"key": "38995225", "model": "llama", "target_model": "gpt4", "recognition_score": 0.461016759019083, "ground_truth": 0}, {"key": "38995225", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5097644000507117, "ground_truth": 0}, {"key": "34242311", "model": "llama", "target_model": "llama", "recognition_score": 0.8587185841284538, "ground_truth": 1}, {"key": "34242311", "model": "llama", "target_model": "human", "recognition_score": 0.7676898547144112, "ground_truth": 0}, {"key": "34242311", "model": "llama", "target_model": "claude", "recognition_score": 0.8418256459179286, "ground_truth": 0}, {"key": "34242311", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9026096110436724, "ground_truth": 0}, {"key": "34242311", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8895288500511899, "ground_truth": 0}, {"key": "39253748", "model": "llama", "target_model": "llama", "recognition_score": 0.9059898191171584, "ground_truth": 1}, {"key": "39253748", "model": "llama", "target_model": "human", "recognition_score": 0.8848377723080675, "ground_truth": 0}, {"key": "39253748", "model": "llama", "target_model": "claude", "recognition_score": 0.887204602114634, "ground_truth": 0}, {"key": "39253748", "model": "llama", "target_model": "gpt4", "recognition_score": 0.920789674364611, "ground_truth": 0}, {"key": "39253748", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9324533078183347, "ground_truth": 0}, {"key": "37131104", "model": "llama", "target_model": "llama", "recognition_score": 0.988222156438066, "ground_truth": 1}, {"key": "37131104", "model": "llama", "target_model": "human", "recognition_score": 0.9895916852886938, "ground_truth": 0}, {"key": "37131104", "model": "llama", "target_model": "claude", "recognition_score": 0.9924227581842535, "ground_truth": 0}, {"key": "37131104", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9851575822540045, "ground_truth": 0}, {"key": "37131104", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9908743620979737, "ground_truth": 0}, {"key": "38490554", "model": "llama", "target_model": "llama", "recognition_score": 0.9381240172095662, "ground_truth": 1}, {"key": "38490554", "model": "llama", "target_model": "human", "recognition_score": 0.923039158374626, "ground_truth": 0}, {"key": "38490554", "model": "llama", "target_model": "claude", "recognition_score": 0.9278877962469528, "ground_truth": 0}, {"key": "38490554", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9782188284725564, "ground_truth": 0}, {"key": "38490554", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9563089418042651, "ground_truth": 0}, {"key": "29009500", "model": "llama", "target_model": "llama", "recognition_score": 0.4436004327322599, "ground_truth": 1}, {"key": "29009500", "model": "llama", "target_model": "human", "recognition_score": 0.6334102712037862, "ground_truth": 0}, {"key": "29009500", "model": "llama", "target_model": "claude", "recognition_score": 0.6671476616594202, "ground_truth": 0}, {"key": "29009500", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3007455621729904, "ground_truth": 0}, {"key": "29009500", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5331543957622579, "ground_truth": 0}, {"key": "36703057", "model": "llama", "target_model": "llama", "recognition_score": 0.875786993983919, "ground_truth": 1}, {"key": "36703057", "model": "llama", "target_model": "human", "recognition_score": 0.8092759574271964, "ground_truth": 0}, {"key": "36703057", "model": "llama", "target_model": "claude", "recognition_score": 0.8080672236714167, "ground_truth": 0}, {"key": "36703057", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8679338500129222, "ground_truth": 0}, {"key": "36703057", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7386690762768949, "ground_truth": 0}, {"key": "34876987", "model": "llama", "target_model": "llama", "recognition_score": 0.9536217965547337, "ground_truth": 1}, {"key": "34876987", "model": "llama", "target_model": "human", "recognition_score": 0.9579122719716157, "ground_truth": 0}, {"key": "34876987", "model": "llama", "target_model": "claude", "recognition_score": 0.906653115927157, "ground_truth": 0}, {"key": "34876987", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9465966712575554, "ground_truth": 0}, {"key": "34876987", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9556514167785614, "ground_truth": 0}, {"key": "36209258", "model": "llama", "target_model": "llama", "recognition_score": 0.8740772363102316, "ground_truth": 1}, {"key": "36209258", "model": "llama", "target_model": "human", "recognition_score": 0.9173026615348578, "ground_truth": 0}, {"key": "36209258", "model": "llama", "target_model": "claude", "recognition_score": 0.9086178926810569, "ground_truth": 0}, {"key": "36209258", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7969253859877601, "ground_truth": 0}, {"key": "36209258", "model": "llama", "target_model": "gpt35", "recognition_score": 0.709019145961977, "ground_truth": 0}, {"key": "36854437", "model": "llama", "target_model": "llama", "recognition_score": 0.407333387166805, "ground_truth": 1}, {"key": "36854437", "model": "llama", "target_model": "human", "recognition_score": 0.4921881259245977, "ground_truth": 0}, {"key": "36854437", "model": "llama", "target_model": "claude", "recognition_score": 0.43782346330027805, "ground_truth": 0}, {"key": "36854437", "model": "llama", "target_model": "gpt4", "recognition_score": 0.30735801805677615, "ground_truth": 0}, {"key": "36854437", "model": "llama", "target_model": "gpt35", "recognition_score": 0.42059957495842293, "ground_truth": 0}, {"key": "38047723", "model": "llama", "target_model": "llama", "recognition_score": 0.22815651206186185, "ground_truth": 1}, {"key": "38047723", "model": "llama", "target_model": "human", "recognition_score": 0.22135068429065208, "ground_truth": 0}, {"key": "38047723", "model": "llama", "target_model": "claude", "recognition_score": 0.15002881327832357, "ground_truth": 0}, {"key": "38047723", "model": "llama", "target_model": "gpt4", "recognition_score": 0.22270013046499693, "ground_truth": 0}, {"key": "38047723", "model": "llama", "target_model": "gpt35", "recognition_score": 0.27512972965319804, "ground_truth": 0}, {"key": "34287816", "model": "llama", "target_model": "llama", "recognition_score": 0.6424324661288484, "ground_truth": 1}, {"key": "34287816", "model": "llama", "target_model": "human", "recognition_score": 0.6859494532740774, "ground_truth": 0}, {"key": "34287816", "model": "llama", "target_model": "claude", "recognition_score": 0.732591818034747, "ground_truth": 0}, {"key": "34287816", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8311430463607389, "ground_truth": 0}, {"key": "34287816", "model": "llama", "target_model": "gpt35", "recognition_score": 0.759225415352073, "ground_truth": 0}, {"key": "33235855", "model": "llama", "target_model": "llama", "recognition_score": 0.9706877691513928, "ground_truth": 1}, {"key": "33235855", "model": "llama", "target_model": "human", "recognition_score": 0.9681411504911822, "ground_truth": 0}, {"key": "33235855", "model": "llama", "target_model": "claude", "recognition_score": 0.9742394400566811, "ground_truth": 0}, {"key": "33235855", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9828232915078364, "ground_truth": 0}, {"key": "33235855", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9771973639708271, "ground_truth": 0}, {"key": "34381016", "model": "llama", "target_model": "llama", "recognition_score": 0.885631468208582, "ground_truth": 1}, {"key": "34381016", "model": "llama", "target_model": "human", "recognition_score": 0.9339146234991067, "ground_truth": 0}, {"key": "34381016", "model": "llama", "target_model": "claude", "recognition_score": 0.9263037206248932, "ground_truth": 0}, {"key": "34381016", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9284088086861568, "ground_truth": 0}, {"key": "34381016", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7892336849321794, "ground_truth": 0}, {"key": "28064995", "model": "llama", "target_model": "llama", "recognition_score": 0.831143051888337, "ground_truth": 1}, {"key": "28064995", "model": "llama", "target_model": "human", "recognition_score": 0.8991213697254121, "ground_truth": 0}, {"key": "28064995", "model": "llama", "target_model": "claude", "recognition_score": 0.7662936288282074, "ground_truth": 0}, {"key": "28064995", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8116760257000842, "ground_truth": 0}, {"key": "28064995", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8322366610027376, "ground_truth": 0}, {"key": "37576197", "model": "llama", "target_model": "llama", "recognition_score": 0.6297746115697087, "ground_truth": 1}, {"key": "37576197", "model": "llama", "target_model": "human", "recognition_score": 0.6150878449228767, "ground_truth": 0}, {"key": "37576197", "model": "llama", "target_model": "claude", "recognition_score": 0.6842640063255022, "ground_truth": 0}, {"key": "37576197", "model": "llama", "target_model": "gpt4", "recognition_score": 0.661922862306831, "ground_truth": 0}, {"key": "37576197", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4186969112372235, "ground_truth": 0}, {"key": "34454741", "model": "llama", "target_model": "llama", "recognition_score": 0.7217431958776248, "ground_truth": 1}, {"key": "34454741", "model": "llama", "target_model": "human", "recognition_score": 0.6825737114003964, "ground_truth": 0}, {"key": "34454741", "model": "llama", "target_model": "claude", "recognition_score": 0.7090191176697377, "ground_truth": 0}, {"key": "34454741", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6150878582891944, "ground_truth": 0}, {"key": "34454741", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5506073700906814, "ground_truth": 0}, {"key": "34766970", "model": "llama", "target_model": "llama", "recognition_score": 0.6909762845805635, "ground_truth": 1}, {"key": "34766970", "model": "llama", "target_model": "human", "recognition_score": 0.6406358570305503, "ground_truth": 0}, {"key": "34766970", "model": "llama", "target_model": "claude", "recognition_score": 0.341582507159584, "ground_truth": 0}, {"key": "34766970", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7461389958152203, "ground_truth": 0}, {"key": "34766970", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5486734703580683, "ground_truth": 0}, {"key": "35574186", "model": "llama", "target_model": "llama", "recognition_score": 0.9289263307679787, "ground_truth": 1}, {"key": "35574186", "model": "llama", "target_model": "human", "recognition_score": 0.7826624864292429, "ground_truth": 0}, {"key": "35574186", "model": "llama", "target_model": "claude", "recognition_score": 0.8652241005708625, "ground_truth": 0}, {"key": "35574186", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9178933754851378, "ground_truth": 0}, {"key": "35574186", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8933093985191295, "ground_truth": 0}, {"key": "35486470", "model": "llama", "target_model": "llama", "recognition_score": 0.7994423291730477, "ground_truth": 1}, {"key": "35486470", "model": "llama", "target_model": "human", "recognition_score": 0.6513548545218313, "ground_truth": 0}, {"key": "35486470", "model": "llama", "target_model": "claude", "recognition_score": 0.7956581037580723, "ground_truth": 0}, {"key": "35486470", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7233094691748612, "ground_truth": 0}, {"key": "35486470", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6531269293791965, "ground_truth": 0}, {"key": "40977702", "model": "llama", "target_model": "llama", "recognition_score": 0.6113819552721517, "ground_truth": 1}, {"key": "40977702", "model": "llama", "target_model": "human", "recognition_score": 0.6261241821371746, "ground_truth": 0}, {"key": "40977702", "model": "llama", "target_model": "claude", "recognition_score": 0.6442251262529541, "ground_truth": 0}, {"key": "40977702", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4804786375576753, "ground_truth": 0}, {"key": "40977702", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7690802275096232, "ground_truth": 0}, {"key": "35336618", "model": "llama", "target_model": "llama", "recognition_score": 0.9324533090490493, "ground_truth": 1}, {"key": "35336618", "model": "llama", "target_model": "human", "recognition_score": 0.902609606212852, "ground_truth": 0}, {"key": "35336618", "model": "llama", "target_model": "claude", "recognition_score": 0.9213576196771781, "ground_truth": 0}, {"key": "35336618", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9161096121453097, "ground_truth": 0}, {"key": "35336618", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9348724553717331, "ground_truth": 0}, {"key": "33024679", "model": "llama", "target_model": "llama", "recognition_score": 0.7676898473426331, "ground_truth": 1}, {"key": "33024679", "model": "llama", "target_model": "human", "recognition_score": 0.7248702691029321, "ground_truth": 0}, {"key": "33024679", "model": "llama", "target_model": "claude", "recognition_score": 0.8311430515794194, "ground_truth": 0}, {"key": "33024679", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7461389903873749, "ground_truth": 0}, {"key": "33024679", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8633916064555459, "ground_truth": 0}, {"key": "37451334", "model": "llama", "target_model": "llama", "recognition_score": 0.6352224379905507, "ground_truth": 1}, {"key": "37451334", "model": "llama", "target_model": "human", "recognition_score": 0.7745833775474418, "ground_truth": 0}, {"key": "37451334", "model": "llama", "target_model": "claude", "recognition_score": 0.9124361571159314, "ground_truth": 0}, {"key": "37451334", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8267117991579972, "ground_truth": 0}, {"key": "37451334", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8991213777118823, "ground_truth": 0}, {"key": "33354824", "model": "llama", "target_model": "llama", "recognition_score": 0.6095241732538558, "ground_truth": 1}, {"key": "33354824", "model": "llama", "target_model": "human", "recognition_score": 0.7170118748362239, "ground_truth": 0}, {"key": "33354824", "model": "llama", "target_model": "claude", "recognition_score": 0.4111108494996425, "ground_truth": 0}, {"key": "33354824", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5945512889708033, "ground_truth": 0}, {"key": "33354824", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4416730041025084, "ground_truth": 0}, {"key": "34688538", "model": "llama", "target_model": "llama", "recognition_score": 0.7416740312911907, "ground_truth": 1}, {"key": "34688538", "model": "llama", "target_model": "human", "recognition_score": 0.6992544136008341, "ground_truth": 0}, {"key": "34688538", "model": "llama", "target_model": "claude", "recognition_score": 0.7931059515899577, "ground_truth": 0}, {"key": "34688538", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8092759814249824, "ground_truth": 0}, {"key": "34688538", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7505527536822797, "ground_truth": 0}, {"key": "33646276", "model": "llama", "target_model": "llama", "recognition_score": 0.4746311844818192, "ground_truth": 1}, {"key": "33646276", "model": "llama", "target_model": "human", "recognition_score": 0.5195213178391777, "ground_truth": 0}, {"key": "33646276", "model": "llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "33646276", "model": "llama", "target_model": "gpt4", "recognition_score": 0.36116470095391356, "ground_truth": 0}, {"key": "33646276", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6842640474464551, "ground_truth": 0}, {"key": "40322608", "model": "llama", "target_model": "llama", "recognition_score": 0.9202179890417636, "ground_truth": 1}, {"key": "40322608", "model": "llama", "target_model": "human", "recognition_score": 0.8469578408509437, "ground_truth": 0}, {"key": "40322608", "model": "llama", "target_model": "claude", "recognition_score": 0.9563089381486184, "ground_truth": 0}, {"key": "40322608", "model": "llama", "target_model": "gpt4", "recognition_score": 0.861538208397689, "ground_truth": 0}, {"key": "40322608", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9473810503451383, "ground_truth": 0}, {"key": "39565762", "model": "llama", "target_model": "llama", "recognition_score": 0.9525741288398869, "ground_truth": 1}, {"key": "39565762", "model": "llama", "target_model": "human", "recognition_score": 0.9469902232338264, "ground_truth": 0}, {"key": "39565762", "model": "llama", "target_model": "claude", "recognition_score": 0.7431680174282161, "ground_truth": 0}, {"key": "39565762", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9618217236714206, "ground_truth": 0}, {"key": "39565762", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8832359740040013, "ground_truth": 0}, {"key": "30534259", "model": "llama", "target_model": "llama", "recognition_score": 0.9372107920975625, "ground_truth": 1}, {"key": "30534259", "model": "llama", "target_model": "human", "recognition_score": 0.8210441315430742, "ground_truth": 0}, {"key": "30534259", "model": "llama", "target_model": "claude", "recognition_score": 0.7956581047194116, "ground_truth": 0}, {"key": "30534259", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8499711739824966, "ground_truth": 0}, {"key": "30534259", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7918210761137974, "ground_truth": 0}, {"key": "39644242", "model": "llama", "target_model": "llama", "recognition_score": 0.9173026485640313, "ground_truth": 1}, {"key": "39644242", "model": "llama", "target_model": "human", "recognition_score": 0.7154239800750491, "ground_truth": 0}, {"key": "39644242", "model": "llama", "target_model": "claude", "recognition_score": 0.9294404017979825, "ground_truth": 0}, {"key": "39644242", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8962513739268647, "ground_truth": 0}, {"key": "39644242", "model": "llama", "target_model": "gpt35", "recognition_score": 0.857768101344431, "ground_truth": 0}, {"key": "19853740", "model": "llama", "target_model": "llama", "recognition_score": 0.8233284123805905, "ground_truth": 1}, {"key": "19853740", "model": "llama", "target_model": "human", "recognition_score": 0.7918210684275537, "ground_truth": 0}, {"key": "19853740", "model": "llama", "target_model": "claude", "recognition_score": 0.9263037327198491, "ground_truth": 0}, {"key": "19853740", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8322366567022162, "ground_truth": 0}, {"key": "19853740", "model": "llama", "target_model": "gpt35", "recognition_score": 0.901227411570595, "ground_truth": 0}, {"key": "33023078", "model": "llama", "target_model": "llama", "recognition_score": 0.9207896892063908, "ground_truth": 1}, {"key": "33023078", "model": "llama", "target_model": "human", "recognition_score": 0.9334308037626957, "ground_truth": 0}, {"key": "33023078", "model": "llama", "target_model": "claude", "recognition_score": 0.8714748547184146, "ground_truth": 0}, {"key": "33023078", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9358173542404485, "ground_truth": 0}, {"key": "33023078", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9394706062656536, "ground_truth": 0}, {"key": "38329806", "model": "llama", "target_model": "llama", "recognition_score": 0.44746030368269935, "ground_truth": 1}, {"key": "38329806", "model": "llama", "target_model": "human", "recognition_score": 0.4130036005525814, "ground_truth": 0}, {"key": "38329806", "model": "llama", "target_model": "claude", "recognition_score": 0.5214711766410595, "ground_truth": 0}, {"key": "38329806", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5156199291469743, "ground_truth": 0}, {"key": "38329806", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4282333764522903, "ground_truth": 0}, {"key": "38761942", "model": "llama", "target_model": "llama", "recognition_score": 0.694302684266849, "ground_truth": 1}, {"key": "38761942", "model": "llama", "target_model": "human", "recognition_score": 0.682573752325878, "ground_truth": 0}, {"key": "38761942", "model": "llama", "target_model": "claude", "recognition_score": 0.8080672166437316, "ground_truth": 0}, {"key": "38761942", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7918210804832078, "ground_truth": 0}, {"key": "38761942", "model": "llama", "target_model": "gpt35", "recognition_score": 0.535098400909525, "ground_truth": 0}, {"key": "33773576", "model": "llama", "target_model": "llama", "recognition_score": 0.5832033382854716, "ground_truth": 1}, {"key": "33773576", "model": "llama", "target_model": "human", "recognition_score": 0.8947894754856694, "ground_truth": 0}, {"key": "33773576", "model": "llama", "target_model": "claude", "recognition_score": 0.660172384684199, "ground_truth": 0}, {"key": "33773576", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7264255936975966, "ground_truth": 0}, {"key": "33773576", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8344068770791516, "ground_truth": 0}, {"key": "37642631", "model": "llama", "target_model": "llama", "recognition_score": 0.7476159556666675, "ground_truth": 1}, {"key": "37642631", "model": "llama", "target_model": "human", "recognition_score": 0.8267118045969034, "ground_truth": 0}, {"key": "37642631", "model": "llama", "target_model": "claude", "recognition_score": 0.6388352760566082, "ground_truth": 0}, {"key": "37642631", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8006919981882381, "ground_truth": 0}, {"key": "37642631", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6601723822481546, "ground_truth": 0}, {"key": "36609836", "model": "llama", "target_model": "llama", "recognition_score": 0.9124361573334558, "ground_truth": 1}, {"key": "36609836", "model": "llama", "target_model": "human", "recognition_score": 0.899121384987492, "ground_truth": 0}, {"key": "36609836", "model": "llama", "target_model": "claude", "recognition_score": 0.9603611602341368, "ground_truth": 0}, {"key": "36609836", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9367494783901639, "ground_truth": 0}, {"key": "36609836", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8624675322975494, "ground_truth": 0}, {"key": "41035610", "model": "llama", "target_model": "llama", "recognition_score": 0.7356416486573433, "ground_truth": 1}, {"key": "41035610", "model": "llama", "target_model": "human", "recognition_score": 0.847967760394343, "ground_truth": 0}, {"key": "41035610", "model": "llama", "target_model": "claude", "recognition_score": 0.7704647798430466, "ground_truth": 0}, {"key": "41035610", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7490872211577553, "ground_truth": 0}, {"key": "41035610", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8006920146350461, "ground_truth": 0}, {"key": "37592684", "model": "llama", "target_model": "llama", "recognition_score": 0.8068526395440844, "ground_truth": 1}, {"key": "37592684", "model": "llama", "target_model": "human", "recognition_score": 0.9032942071232697, "ground_truth": 0}, {"key": "37592684", "model": "llama", "target_model": "claude", "recognition_score": 0.8714748506610043, "ground_truth": 0}, {"key": "37592684", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9485372322132712, "ground_truth": 0}, {"key": "37592684", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9184802556709631, "ground_truth": 0}, {"key": "38951040", "model": "llama", "target_model": "llama", "recognition_score": 0.89256252969362, "ground_truth": 1}, {"key": "38951040", "model": "llama", "target_model": "human", "recognition_score": 0.6723317074675877, "ground_truth": 0}, {"key": "38951040", "model": "llama", "target_model": "claude", "recognition_score": 0.8397339710640169, "ground_truth": 0}, {"key": "38951040", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7356416363310009, "ground_truth": 0}, {"key": "38951040", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8244619533689529, "ground_truth": 0}, {"key": "40774469", "model": "llama", "target_model": "llama", "recognition_score": 0.18594718184084233, "ground_truth": 1}, {"key": "40774469", "model": "llama", "target_model": "human", "recognition_score": 0.11357958720910542, "ground_truth": 0}, {"key": "40774469", "model": "llama", "target_model": "claude", "recognition_score": 0.3647775519490132, "ground_truth": 0}, {"key": "40774469", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4765796390473985, "ground_truth": 0}, {"key": "40774469", "model": "llama", "target_model": "gpt35", "recognition_score": 0.36477753611785263, "ground_truth": 0}, {"key": "40876288", "model": "llama", "target_model": "llama", "recognition_score": 0.92630372682851, "ground_truth": 1}, {"key": "40876288", "model": "llama", "target_model": "human", "recognition_score": 0.8438950976092833, "ground_truth": 0}, {"key": "40876288", "model": "llama", "target_model": "claude", "recognition_score": 0.7772998684255935, "ground_truth": 0}, {"key": "40876288", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7446563271569009, "ground_truth": 0}, {"key": "40876288", "model": "llama", "target_model": "gpt35", "recognition_score": 0.672331676759881, "ground_truth": 0}, {"key": "40340131", "model": "llama", "target_model": "llama", "recognition_score": 0.9184802454538314, "ground_truth": 1}, {"key": "40340131", "model": "llama", "target_model": "human", "recognition_score": 0.938124015202801, "ground_truth": 0}, {"key": "40340131", "model": "llama", "target_model": "claude", "recognition_score": 0.851952811014618, "ground_truth": 0}, {"key": "40340131", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9376689648455888, "ground_truth": 0}, {"key": "40340131", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9348724567136528, "ground_truth": 0}, {"key": "30121591", "model": "llama", "target_model": "llama", "recognition_score": 0.838679759915744, "ground_truth": 1}, {"key": "30121591", "model": "llama", "target_model": "human", "recognition_score": 0.8577681113295134, "ground_truth": 0}, {"key": "30121591", "model": "llama", "target_model": "claude", "recognition_score": 0.6206216063855167, "ground_truth": 0}, {"key": "30121591", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9263037275878863, "ground_truth": 0}, {"key": "30121591", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9399133433103501, "ground_truth": 0}, {"key": "35623366", "model": "llama", "target_model": "llama", "recognition_score": 0.8661325094552851, "ground_truth": 1}, {"key": "35623366", "model": "llama", "target_model": "human", "recognition_score": 0.6513548662743451, "ground_truth": 0}, {"key": "35623366", "model": "llama", "target_model": "claude", "recognition_score": 0.8969755684326726, "ground_truth": 0}, {"key": "35623366", "model": "llama", "target_model": "gpt4", "recognition_score": 0.865224085675828, "ground_truth": 0}, {"key": "35623366", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8962513705078216, "ground_truth": 0}, {"key": "41014093", "model": "llama", "target_model": "llama", "recognition_score": 0.7461389768383954, "ground_truth": 1}, {"key": "41014093", "model": "llama", "target_model": "human", "recognition_score": 0.7732163797172669, "ground_truth": 0}, {"key": "41014093", "model": "llama", "target_model": "claude", "recognition_score": 0.86703575881432, "ground_truth": 0}, {"key": "41014093", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8615382102009923, "ground_truth": 0}, {"key": "41014093", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7772998716307878, "ground_truth": 0}, {"key": "11387984", "model": "llama", "target_model": "llama", "recognition_score": 0.8714748639871782, "ground_truth": 1}, {"key": "11387984", "model": "llama", "target_model": "human", "recognition_score": 0.7704647952418859, "ground_truth": 0}, {"key": "11387984", "model": "llama", "target_model": "claude", "recognition_score": 0.9207896745870615, "ground_truth": 0}, {"key": "11387984", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7759445471161255, "ground_truth": 0}, {"key": "11387984", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7662936591937297, "ground_truth": 0}, {"key": "39508312", "model": "llama", "target_model": "llama", "recognition_score": 0.8019358350852835, "ground_truth": 1}, {"key": "39508312", "model": "llama", "target_model": "human", "recognition_score": 0.7892336949845021, "ground_truth": 0}, {"key": "39508312", "model": "llama", "target_model": "claude", "recognition_score": 0.8386797529134805, "ground_truth": 0}, {"key": "39508312", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8311430489380403, "ground_truth": 0}, {"key": "39508312", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8152324826222348, "ground_truth": 0}, {"key": "35815369", "model": "llama", "target_model": "llama", "recognition_score": 0.6334102508380494, "ground_truth": 1}, {"key": "35815369", "model": "llama", "target_model": "human", "recognition_score": 0.7662936467125612, "ground_truth": 0}, {"key": "35815369", "model": "llama", "target_model": "claude", "recognition_score": 0.7170118837014597, "ground_truth": 0}, {"key": "35815369", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8175744622801704, "ground_truth": 0}, {"key": "35815369", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7799928995790204, "ground_truth": 0}, {"key": "35802823", "model": "llama", "target_model": "llama", "recognition_score": 0.7956580926453195, "ground_truth": 1}, {"key": "35802823", "model": "llama", "target_model": "human", "recognition_score": 0.6113819911124085, "ground_truth": 0}, {"key": "35802823", "model": "llama", "target_model": "claude", "recognition_score": 0.8918110494840424, "ground_truth": 0}, {"key": "35802823", "model": "llama", "target_model": "gpt4", "recognition_score": 0.59455127393624, "ground_truth": 0}, {"key": "35802823", "model": "llama", "target_model": "gpt35", "recognition_score": 0.720171487769521, "ground_truth": 0}, {"key": "38499968", "model": "llama", "target_model": "llama", "recognition_score": 0.9105454014768007, "ground_truth": 1}, {"key": "38499968", "model": "llama", "target_model": "human", "recognition_score": 0.8615382249128959, "ground_truth": 0}, {"key": "38499968", "model": "llama", "target_model": "claude", "recognition_score": 0.9099069981625979, "ground_truth": 0}, {"key": "38499968", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8322366431185503, "ground_truth": 0}, {"key": "38499968", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9284088022847407, "ground_truth": 0}, {"key": "36926726", "model": "llama", "target_model": "llama", "recognition_score": 0.8365545694471874, "ground_truth": 1}, {"key": "36926726", "model": "llama", "target_model": "human", "recognition_score": 0.9257686237226486, "ground_truth": 0}, {"key": "36926726", "model": "llama", "target_model": "claude", "recognition_score": 0.9099069984633561, "ground_truth": 0}, {"key": "36926726", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9224823363354077, "ground_truth": 0}, {"key": "36926726", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9099070031742748, "ground_truth": 0}, {"key": "40903712", "model": "llama", "target_model": "llama", "recognition_score": 0.8499711777442638, "ground_truth": 1}, {"key": "40903712", "model": "llama", "target_model": "human", "recognition_score": 0.9190632892612053, "ground_truth": 0}, {"key": "40903712", "model": "llama", "target_model": "claude", "recognition_score": 0.857768100588295, "ground_truth": 0}, {"key": "40903712", "model": "llama", "target_model": "gpt4", "recognition_score": 0.930962075605976, "ground_truth": 0}, {"key": "40903712", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8749346120071739, "ground_truth": 0}, {"key": "19614862", "model": "llama", "target_model": "llama", "recognition_score": 0.9268352800315397, "ground_truth": 1}, {"key": "19614862", "model": "llama", "target_model": "human", "recognition_score": 0.4882833976951445, "ground_truth": 0}, {"key": "19614862", "model": "llama", "target_model": "claude", "recognition_score": 0.8479677712785174, "ground_truth": 0}, {"key": "19614862", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7732163531633605, "ground_truth": 0}, {"key": "19614862", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5214711367672972, "ground_truth": 0}, {"key": "38861704", "model": "llama", "target_model": "llama", "recognition_score": 0.6619228708086815, "ground_truth": 1}, {"key": "38861704", "model": "llama", "target_model": "human", "recognition_score": 0.7520125782286947, "ground_truth": 0}, {"key": "38861704", "model": "llama", "target_model": "claude", "recognition_score": 0.6406358580144079, "ground_truth": 0}, {"key": "38861704", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6688802565319126, "ground_truth": 0}, {"key": "38861704", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7956581231446856, "ground_truth": 0}, {"key": "34349607", "model": "llama", "target_model": "llama", "recognition_score": 0.5926665947373952, "ground_truth": 1}, {"key": "34349607", "model": "llama", "target_model": "human", "recognition_score": 0.7041601200054993, "ground_truth": 0}, {"key": "34349607", "model": "llama", "target_model": "claude", "recognition_score": 0.613236548682607, "ground_truth": 0}, {"key": "34349607", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4902356136675703, "ground_truth": 0}, {"key": "34349607", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6654105479709419, "ground_truth": 0}, {"key": "20773800", "model": "llama", "target_model": "llama", "recognition_score": 0.27825679117279545, "ground_truth": 1}, {"key": "20773800", "model": "llama", "target_model": "human", "recognition_score": 0.10594827579189427, "ground_truth": 0}, {"key": "20773800", "model": "llama", "target_model": "claude", "recognition_score": 0.08819004438340862, "ground_truth": 0}, {"key": "20773800", "model": "llama", "target_model": "gpt4", "recognition_score": 0.10818895552197356, "ground_truth": 0}, {"key": "20773800", "model": "llama", "target_model": "gpt35", "recognition_score": 0.17328820282526375, "ground_truth": 0}, {"key": "35545608", "model": "llama", "target_model": "llama", "recognition_score": 0.6976089019187118, "ground_truth": 1}, {"key": "35545608", "model": "llama", "target_model": "human", "recognition_score": 0.6495786086107109, "ground_truth": 0}, {"key": "35545608", "model": "llama", "target_model": "claude", "recognition_score": 0.5851011564845569, "ground_truth": 0}, {"key": "35545608", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7534666594497774, "ground_truth": 0}, {"key": "35545608", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7461389901801944, "ground_truth": 0}, {"key": "37258984", "model": "llama", "target_model": "llama", "recognition_score": 0.6460137093884526, "ground_truth": 1}, {"key": "37258984", "model": "llama", "target_model": "human", "recognition_score": 0.4746311717774807, "ground_truth": 0}, {"key": "37258984", "model": "llama", "target_model": "claude", "recognition_score": 0.6584175022652189, "ground_truth": 0}, {"key": "37258984", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3960681448002564, "ground_truth": 0}, {"key": "37258984", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7956581001368271, "ground_truth": 0}, {"key": "37274562", "model": "llama", "target_model": "llama", "recognition_score": 0.8902942200430242, "ground_truth": 1}, {"key": "37274562", "model": "llama", "target_model": "human", "recognition_score": 0.8723473849902771, "ground_truth": 0}, {"key": "37274562", "model": "llama", "target_model": "claude", "recognition_score": 0.8697145822312561, "ground_truth": 0}, {"key": "37274562", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9032941987011743, "ground_truth": 0}, {"key": "37274562", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8643104669263756, "ground_truth": 0}, {"key": "40828068", "model": "llama", "target_model": "llama", "recognition_score": 0.9263037256078762, "ground_truth": 1}, {"key": "40828068", "model": "llama", "target_model": "human", "recognition_score": 0.9339146230942007, "ground_truth": 0}, {"key": "40828068", "model": "llama", "target_model": "claude", "recognition_score": 0.9362850037468683, "ground_truth": 0}, {"key": "40828068", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8749346291815802, "ground_truth": 0}, {"key": "40828068", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9477691419534849, "ground_truth": 0}, {"key": "37807180", "model": "llama", "target_model": "llama", "recognition_score": 0.8233283861377884, "ground_truth": 1}, {"key": "37807180", "model": "llama", "target_model": "human", "recognition_score": 0.8300437620151532, "ground_truth": 0}, {"key": "37807180", "model": "llama", "target_model": "claude", "recognition_score": 0.9073122237768383, "ground_truth": 0}, {"key": "37807180", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8633915973468309, "ground_truth": 0}, {"key": "37807180", "model": "llama", "target_model": "gpt35", "recognition_score": 0.840782597377959, "ground_truth": 0}, {"key": "40748607", "model": "llama", "target_model": "llama", "recognition_score": 0.983722539597987, "ground_truth": 1}, {"key": "40748607", "model": "llama", "target_model": "human", "recognition_score": 0.9868787291269274, "ground_truth": 0}, {"key": "40748607", "model": "llama", "target_model": "claude", "recognition_score": 0.9876638986805083, "ground_truth": 0}, {"key": "40748607", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9900635818491195, "ground_truth": 0}, {"key": "40748607", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9866748517165239, "ground_truth": 0}, {"key": "40123819", "model": "llama", "target_model": "llama", "recognition_score": 0.9394706124423281, "ground_truth": 1}, {"key": "40123819", "model": "llama", "target_model": "human", "recognition_score": 0.9496693618872595, "ground_truth": 0}, {"key": "40123819", "model": "llama", "target_model": "claude", "recognition_score": 0.9678992894610451, "ground_truth": 0}, {"key": "40123819", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9559813472564439, "ground_truth": 0}, {"key": "40123819", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9257686282711072, "ground_truth": 0}, {"key": "38453867", "model": "llama", "target_model": "llama", "recognition_score": 0.8529354725810061, "ground_truth": 1}, {"key": "38453867", "model": "llama", "target_model": "human", "recognition_score": 0.779992903603178, "ground_truth": 0}, {"key": "38453867", "model": "llama", "target_model": "claude", "recognition_score": 0.7813306260359187, "ground_truth": 0}, {"key": "38453867", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7892336958332486, "ground_truth": 0}, {"key": "38453867", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8175744846908874, "ground_truth": 0}, {"key": "38944856", "model": "llama", "target_model": "llama", "recognition_score": 0.9224823431659865, "ground_truth": 1}, {"key": "38944856", "model": "llama", "target_model": "human", "recognition_score": 0.9433475776401866, "ground_truth": 0}, {"key": "38944856", "model": "llama", "target_model": "claude", "recognition_score": 0.931462506833031, "ground_truth": 0}, {"key": "38944856", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9469902316868165, "ground_truth": 0}, {"key": "38944856", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8386797532283065, "ground_truth": 0}, {"key": "35778898", "model": "llama", "target_model": "llama", "recognition_score": 0.9385759546484183, "ground_truth": 1}, {"key": "35778898", "model": "llama", "target_model": "human", "recognition_score": 0.9656413106220089, "ground_truth": 0}, {"key": "35778898", "model": "llama", "target_model": "claude", "recognition_score": 0.9518632305087186, "ground_truth": 0}, {"key": "35778898", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9603611606302807, "ground_truth": 0}, {"key": "35778898", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9612438021912484, "ground_truth": 0}, {"key": "32530125", "model": "llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 1}, {"key": "32530125", "model": "llama", "target_model": "human", "recognition_score": 0.34158250529198336, "ground_truth": 0}, {"key": "32530125", "model": "llama", "target_model": "claude", "recognition_score": 0.23370634376315827, "ground_truth": 0}, {"key": "32530125", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4785288139928191, "ground_truth": 0}, {"key": "32530125", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3629691921892561, "ground_truth": 0}, {"key": "35010363", "model": "llama", "target_model": "llama", "recognition_score": 0.7201715159907579, "ground_truth": 1}, {"key": "35010363", "model": "llama", "target_model": "human", "recognition_score": 0.6406358717829556, "ground_truth": 0}, {"key": "35010363", "model": "llama", "target_model": "claude", "recognition_score": 0.7676898594443219, "ground_truth": 0}, {"key": "35010363", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7074046863987574, "ground_truth": 0}, {"key": "35010363", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6959583394432777, "ground_truth": 0}, {"key": "27514800", "model": "llama", "target_model": "llama", "recognition_score": 0.9019206818093253, "ground_truth": 1}, {"key": "27514800", "model": "llama", "target_model": "human", "recognition_score": 0.8933094025705407, "ground_truth": 0}, {"key": "27514800", "model": "llama", "target_model": "claude", "recognition_score": 0.9566342050769259, "ground_truth": 0}, {"key": "27514800", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8221891297332131, "ground_truth": 0}, {"key": "27514800", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9032942047542178, "ground_truth": 0}, {"key": "25725840", "model": "llama", "target_model": "llama", "recognition_score": 0.14318771202877145, "ground_truth": 1}, {"key": "25725840", "model": "llama", "target_model": "human", "recognition_score": 0.20181322566555923, "ground_truth": 0}, {"key": "25725840", "model": "llama", "target_model": "claude", "recognition_score": 0.4167966341445722, "ground_truth": 0}, {"key": "25725840", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4649015498953927, "ground_truth": 0}, {"key": "25725840", "model": "llama", "target_model": "gpt35", "recognition_score": 0.24653333907263433, "ground_truth": 0}, {"key": "38327225", "model": "llama", "target_model": "llama", "recognition_score": 0.6992544330121793, "ground_truth": 1}, {"key": "38327225", "model": "llama", "target_model": "human", "recognition_score": 0.544801409268975, "ground_truth": 0}, {"key": "38327225", "model": "llama", "target_model": "claude", "recognition_score": 0.5486734965009347, "ground_truth": 0}, {"key": "38327225", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4687906233257925, "ground_truth": 0}, {"key": "38327225", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7662936293940451, "ground_truth": 0}, {"key": "11991724", "model": "llama", "target_model": "llama", "recognition_score": 0.9637799401673923, "ground_truth": 1}, {"key": "11991724", "model": "llama", "target_model": "human", "recognition_score": 0.9284087948878488, "ground_truth": 0}, {"key": "11991724", "model": "llama", "target_model": "claude", "recognition_score": 0.9416541581315989, "ground_truth": 0}, {"key": "11991724", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8887587959267601, "ground_truth": 0}, {"key": "11991724", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9465966722529465, "ground_truth": 0}, {"key": "32217545", "model": "llama", "target_model": "llama", "recognition_score": 0.9213576159040745, "ground_truth": 1}, {"key": "32217545", "model": "llama", "target_model": "human", "recognition_score": 0.8333246073301944, "ground_truth": 0}, {"key": "32217545", "model": "llama", "target_model": "claude", "recognition_score": 0.9458012699853297, "ground_truth": 0}, {"key": "32217545", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8080672155533009, "ground_truth": 0}, {"key": "32217545", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9136765253943283, "ground_truth": 0}, {"key": "12731847", "model": "llama", "target_model": "llama", "recognition_score": 0.7853085736682069, "ground_truth": 1}, {"key": "12731847", "model": "llama", "target_model": "human", "recognition_score": 0.8056322015562377, "ground_truth": 0}, {"key": "12731847", "model": "llama", "target_model": "claude", "recognition_score": 0.6943026649713426, "ground_truth": 0}, {"key": "12731847", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7264256446893403, "ground_truth": 0}, {"key": "12731847", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7520125946080259, "ground_truth": 0}, {"key": "36827234", "model": "llama", "target_model": "llama", "recognition_score": 0.9289263283622402, "ground_truth": 1}, {"key": "36827234", "model": "llama", "target_model": "human", "recognition_score": 0.8615382071270682, "ground_truth": 0}, {"key": "36827234", "model": "llama", "target_model": "claude", "recognition_score": 0.9492946364840332, "ground_truth": 0}, {"key": "36827234", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9294404093483359, "ground_truth": 0}, {"key": "36827234", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9235923219139334, "ground_truth": 0}, {"key": "29111539", "model": "llama", "target_model": "llama", "recognition_score": 0.9149009520461562, "ground_truth": 1}, {"key": "29111539", "model": "llama", "target_model": "human", "recognition_score": 0.8354835574029187, "ground_truth": 0}, {"key": "29111539", "model": "llama", "target_model": "claude", "recognition_score": 0.9202179794463459, "ground_truth": 0}, {"key": "29111539", "model": "llama", "target_model": "gpt4", "recognition_score": 0.939913355302156, "ground_truth": 0}, {"key": "29111539", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9518632263243819, "ground_truth": 0}, {"key": "37763052", "model": "llama", "target_model": "llama", "recognition_score": 0.6636689560256963, "ground_truth": 1}, {"key": "37763052", "model": "llama", "target_model": "human", "recognition_score": 0.7813306129122941, "ground_truth": 0}, {"key": "37763052", "model": "llama", "target_model": "claude", "recognition_score": 0.9445872024263422, "ground_truth": 0}, {"key": "37763052", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8244619158617822, "ground_truth": 0}, {"key": "37763052", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8652240765736638, "ground_truth": 0}, {"key": "30682335", "model": "llama", "target_model": "llama", "recognition_score": 0.7563575975393114, "ground_truth": 1}, {"key": "30682335", "model": "llama", "target_model": "human", "recognition_score": 0.6619228986368594, "ground_truth": 0}, {"key": "30682335", "model": "llama", "target_model": "claude", "recognition_score": 0.7416740134851094, "ground_truth": 0}, {"key": "30682335", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5273165106445153, "ground_truth": 0}, {"key": "30682335", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7279754617889848, "ground_truth": 0}, {"key": "12261276", "model": "llama", "target_model": "llama", "recognition_score": 0.0753123039607775, "ground_truth": 1}, {"key": "12261276", "model": "llama", "target_model": "human", "recognition_score": 0.37022540007101257, "ground_truth": 0}, {"key": "12261276", "model": "llama", "target_model": "claude", "recognition_score": 0.18126320582024924, "ground_truth": 0}, {"key": "12261276", "model": "llama", "target_model": "gpt4", "recognition_score": 0.11920292989594794, "ground_truth": 0}, {"key": "12261276", "model": "llama", "target_model": "gpt35", "recognition_score": 0.252384032899302, "ground_truth": 0}, {"key": "36912979", "model": "llama", "target_model": "llama", "recognition_score": 0.8376199710610197, "ground_truth": 1}, {"key": "36912979", "model": "llama", "target_model": "human", "recognition_score": 0.44939260140432186, "ground_truth": 0}, {"key": "36912979", "model": "llama", "target_model": "claude", "recognition_score": 0.5945512716558834, "ground_truth": 0}, {"key": "36912979", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4765796409477569, "ground_truth": 0}, {"key": "36912979", "model": "llama", "target_model": "gpt35", "recognition_score": 0.44939263894217996, "ground_truth": 0}, {"key": "30205259", "model": "llama", "target_model": "llama", "recognition_score": 0.8705972679048758, "ground_truth": 1}, {"key": "30205259", "model": "llama", "target_model": "human", "recognition_score": 0.8615382106741432, "ground_truth": 0}, {"key": "30205259", "model": "llama", "target_model": "claude", "recognition_score": 0.9118099567006505, "ground_truth": 0}, {"key": "30205259", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8848377749822083, "ground_truth": 0}, {"key": "30205259", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8529354873794961, "ground_truth": 0}, {"key": "39458032", "model": "llama", "target_model": "llama", "recognition_score": 0.9932550109623797, "ground_truth": 1}, {"key": "39458032", "model": "llama", "target_model": "human", "recognition_score": 0.9911526441855206, "ground_truth": 0}, {"key": "39458032", "model": "llama", "target_model": "claude", "recognition_score": 0.9683812332500574, "ground_truth": 0}, {"key": "39458032", "model": "llama", "target_model": "gpt4", "recognition_score": 0.981735722353667, "ground_truth": 0}, {"key": "39458032", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9805806528416662, "ground_truth": 0}, {"key": "35116452", "model": "llama", "target_model": "llama", "recognition_score": 0.2613309099518727, "ground_truth": 1}, {"key": "35116452", "model": "llama", "target_model": "human", "recognition_score": 0.3830641560159271, "ground_truth": 0}, {"key": "35116452", "model": "llama", "target_model": "claude", "recognition_score": 0.38491215249886523, "ground_truth": 0}, {"key": "35116452", "model": "llama", "target_model": "gpt4", "recognition_score": 0.19193279235209088, "ground_truth": 0}, {"key": "35116452", "model": "llama", "target_model": "gpt35", "recognition_score": 0.2893717228401696, "ground_truth": 0}, {"key": "40107476", "model": "llama", "target_model": "llama", "recognition_score": 0.9079671350873031, "ground_truth": 1}, {"key": "40107476", "model": "llama", "target_model": "human", "recognition_score": 0.9219218346154462, "ground_truth": 0}, {"key": "40107476", "model": "llama", "target_model": "claude", "recognition_score": 0.9219218286367611, "ground_truth": 0}, {"key": "40107476", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9511422165749549, "ground_truth": 0}, {"key": "40107476", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8984105652133151, "ground_truth": 0}, {"key": "39501049", "model": "llama", "target_model": "llama", "recognition_score": 0.9722043762419065, "ground_truth": 1}, {"key": "39501049", "model": "llama", "target_model": "human", "recognition_score": 0.9825575155537882, "ground_truth": 0}, {"key": "39501049", "model": "llama", "target_model": "claude", "recognition_score": 0.9736446469999117, "ground_truth": 0}, {"key": "39501049", "model": "llama", "target_model": "gpt4", "recognition_score": 0.970909243808218, "ground_truth": 0}, {"key": "39501049", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9585377253131653, "ground_truth": 0}, {"key": "39642178", "model": "llama", "target_model": "llama", "recognition_score": 0.7074046954331312, "ground_truth": 1}, {"key": "39642178", "model": "llama", "target_model": "human", "recognition_score": 0.7704648048821925, "ground_truth": 0}, {"key": "39642178", "model": "llama", "target_model": "claude", "recognition_score": 0.5156199293420255, "ground_truth": 0}, {"key": "39642178", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5794004259543192, "ground_truth": 0}, {"key": "39642178", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4804786972123098, "ground_truth": 0}, {"key": "38024796", "model": "llama", "target_model": "llama", "recognition_score": 0.2704801959161228, "ground_truth": 1}, {"key": "38024796", "model": "llama", "target_model": "human", "recognition_score": 0.6057990662978473, "ground_truth": 0}, {"key": "38024796", "model": "llama", "target_model": "claude", "recognition_score": 0.1613202484860851, "ground_truth": 0}, {"key": "38024796", "model": "llama", "target_model": "gpt4", "recognition_score": 0.26740817947380247, "ground_truth": 0}, {"key": "38024796", "model": "llama", "target_model": "gpt35", "recognition_score": 0.25091277075813034, "ground_truth": 0}, {"key": "36652079", "model": "llama", "target_model": "llama", "recognition_score": 0.7662936429182914, "ground_truth": 1}, {"key": "36652079", "model": "llama", "target_model": "human", "recognition_score": 0.6566582519957762, "ground_truth": 0}, {"key": "36652079", "model": "llama", "target_model": "claude", "recognition_score": 0.8539127584831043, "ground_truth": 0}, {"key": "36652079", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7799928879370328, "ground_truth": 0}, {"key": "36652079", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7918210889279698, "ground_truth": 0}, {"key": "32193402", "model": "llama", "target_model": "llama", "recognition_score": 0.8947894562010278, "ground_truth": 1}, {"key": "32193402", "model": "llama", "target_model": "human", "recognition_score": 0.81167601802445, "ground_truth": 0}, {"key": "32193402", "model": "llama", "target_model": "claude", "recognition_score": 0.8365545793922108, "ground_truth": 0}, {"key": "32193402", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9686195718008083, "ground_truth": 0}, {"key": "32193402", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9449947144171859, "ground_truth": 0}, {"key": "32589706", "model": "llama", "target_model": "llama", "recognition_score": 0.8783142428414307, "ground_truth": 1}, {"key": "32589706", "model": "llama", "target_model": "human", "recognition_score": 0.8940517146921538, "ground_truth": 0}, {"key": "32589706", "model": "llama", "target_model": "claude", "recognition_score": 0.8606036186292368, "ground_truth": 0}, {"key": "32589706", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8031738062985989, "ground_truth": 0}, {"key": "32589706", "model": "llama", "target_model": "gpt35", "recognition_score": 0.878314236418568, "ground_truth": 0}, {"key": "38590589", "model": "llama", "target_model": "llama", "recognition_score": 0.7620701290551446, "ground_truth": 1}, {"key": "38590589", "model": "llama", "target_model": "human", "recognition_score": 0.7341195223722674, "ground_truth": 0}, {"key": "38590589", "model": "llama", "target_model": "claude", "recognition_score": 0.7620701099639863, "ground_truth": 0}, {"key": "38590589", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7122322049510744, "ground_truth": 0}, {"key": "38590589", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9019206797066313, "ground_truth": 0}, {"key": "37045414", "model": "llama", "target_model": "llama", "recognition_score": 0.9854964212250266, "ground_truth": 1}, {"key": "37045414", "model": "llama", "target_model": "human", "recognition_score": 0.9785492698540774, "ground_truth": 0}, {"key": "37045414", "model": "llama", "target_model": "claude", "recognition_score": 0.9793540709534995, "ground_truth": 0}, {"key": "37045414", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9453993952514548, "ground_truth": 0}, {"key": "37045414", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9742394445089076, "ground_truth": 0}, {"key": "33310095", "model": "llama", "target_model": "llama", "recognition_score": 0.8976952809325006, "ground_truth": 1}, {"key": "33310095", "model": "llama", "target_model": "human", "recognition_score": 0.8774767761608961, "ground_truth": 0}, {"key": "33310095", "model": "llama", "target_model": "claude", "recognition_score": 0.8354835335249335, "ground_truth": 0}, {"key": "33310095", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9777138131517124, "ground_truth": 0}, {"key": "33310095", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9728307648045098, "ground_truth": 0}, {"key": "37934604", "model": "llama", "target_model": "llama", "recognition_score": 0.9489172650991595, "ground_truth": 1}, {"key": "37934604", "model": "llama", "target_model": "human", "recognition_score": 0.7170118631764695, "ground_truth": 0}, {"key": "37934604", "model": "llama", "target_model": "claude", "recognition_score": 0.9184802513825738, "ground_truth": 0}, {"key": "37934604", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9263037338371938, "ground_truth": 0}, {"key": "37934604", "model": "llama", "target_model": "gpt35", "recognition_score": 0.929440394154642, "ground_truth": 0}, {"key": "39012181", "model": "llama", "target_model": "llama", "recognition_score": 0.9885803855870092, "ground_truth": 1}, {"key": "39012181", "model": "llama", "target_model": "human", "recognition_score": 0.9904406006842454, "ground_truth": 0}, {"key": "39012181", "model": "llama", "target_model": "claude", "recognition_score": 0.993511730440351, "ground_truth": 0}, {"key": "39012181", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9820137906829469, "ground_truth": 0}, {"key": "39012181", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9882221570504673, "ground_truth": 0}, {"key": "40221674", "model": "llama", "target_model": "llama", "recognition_score": 0.992184110734209, "ground_truth": 1}, {"key": "40221674", "model": "llama", "target_model": "human", "recognition_score": 0.9651191123147026, "ground_truth": 0}, {"key": "40221674", "model": "llama", "target_model": "claude", "recognition_score": 0.9871787856861147, "ground_truth": 0}, {"key": "40221674", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9722043751152959, "ground_truth": 0}, {"key": "40221674", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9746286901060239, "ground_truth": 0}, {"key": "36884862", "model": "llama", "target_model": "llama", "recognition_score": 0.9086178987796903, "ground_truth": 1}, {"key": "36884862", "model": "llama", "target_model": "human", "recognition_score": 0.948917261193746, "ground_truth": 0}, {"key": "36884862", "model": "llama", "target_model": "claude", "recognition_score": 0.8558511613022896, "ground_truth": 0}, {"key": "36884862", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9105454023985593, "ground_truth": 0}, {"key": "36884862", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8848377632318206, "ground_truth": 0}, {"key": "39054429", "model": "llama", "target_model": "llama", "recognition_score": 0.41869691223398037, "ground_truth": 1}, {"key": "39054429", "model": "llama", "target_model": "human", "recognition_score": 0.7866228132780612, "ground_truth": 0}, {"key": "39054429", "model": "llama", "target_model": "claude", "recognition_score": 0.32594953202747573, "ground_truth": 0}, {"key": "39054429", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4455295298813218, "ground_truth": 0}, {"key": "39054429", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6859494645683929, "ground_truth": 0}, {"key": "36753964", "model": "llama", "target_model": "llama", "recognition_score": 0.3575675136123367, "ground_truth": 1}, {"key": "36753964", "model": "llama", "target_model": "human", "recognition_score": 0.4378235155827372, "ground_truth": 0}, {"key": "36753964", "model": "llama", "target_model": "claude", "recognition_score": 0.6187804448401832, "ground_truth": 0}, {"key": "36753964", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4785288523942766, "ground_truth": 0}, {"key": "36753964", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4863315154108357, "ground_truth": 0}, {"key": "37612459", "model": "llama", "target_model": "llama", "recognition_score": 0.7690802445922301, "ground_truth": 1}, {"key": "37612459", "model": "llama", "target_model": "human", "recognition_score": 0.8688267742421877, "ground_truth": 0}, {"key": "37612459", "model": "llama", "target_model": "claude", "recognition_score": 0.7505527789811982, "ground_truth": 0}, {"key": "37612459", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7401743641121248, "ground_truth": 0}, {"key": "37612459", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8615382116914081, "ground_truth": 0}, {"key": "36805789", "model": "llama", "target_model": "llama", "recognition_score": 0.8289388052612375, "ground_truth": 1}, {"key": "36805789", "model": "llama", "target_model": "human", "recognition_score": 0.9678992977098065, "ground_truth": 0}, {"key": "36805789", "model": "llama", "target_model": "claude", "recognition_score": 0.9603611600659354, "ground_truth": 0}, {"key": "36805789", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9241418218571534, "ground_truth": 0}, {"key": "36805789", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8187367798619107, "ground_truth": 0}, {"key": "12757394", "model": "llama", "target_model": "llama", "recognition_score": 0.4649015901541481, "ground_truth": 1}, {"key": "12757394", "model": "llama", "target_model": "human", "recognition_score": 0.6654105292360056, "ground_truth": 0}, {"key": "12757394", "model": "llama", "target_model": "claude", "recognition_score": 0.5888891238588947, "ground_truth": 0}, {"key": "12757394", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7185944007652725, "ground_truth": 0}, {"key": "12757394", "model": "llama", "target_model": "gpt35", "recognition_score": 0.674050488066214, "ground_truth": 0}, {"key": "32192542", "model": "llama", "target_model": "llama", "recognition_score": 0.9230391649601565, "ground_truth": 1}, {"key": "32192542", "model": "llama", "target_model": "human", "recognition_score": 0.964051676130681, "ground_truth": 0}, {"key": "32192542", "model": "llama", "target_model": "claude", "recognition_score": 0.9678992902041087, "ground_truth": 0}, {"key": "32192542", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9465966664206176, "ground_truth": 0}, {"key": "32192542", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9485372394875853, "ground_truth": 0}, {"key": "34856060", "model": "llama", "target_model": "llama", "recognition_score": 0.6688802411375556, "ground_truth": 1}, {"key": "34856060", "model": "llama", "target_model": "human", "recognition_score": 0.5331543942040239, "ground_truth": 0}, {"key": "34856060", "model": "llama", "target_model": "claude", "recognition_score": 0.8198933424125143, "ground_truth": 0}, {"key": "34856060", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7648916025242546, "ground_truth": 0}, {"key": "34856060", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7634837517044742, "ground_truth": 0}, {"key": "36083416", "model": "llama", "target_model": "llama", "recognition_score": 0.9719924791154195, "ground_truth": 1}, {"key": "36083416", "model": "llama", "target_model": "human", "recognition_score": 0.9515039967411899, "ground_truth": 0}, {"key": "36083416", "model": "llama", "target_model": "claude", "recognition_score": 0.9626731147120215, "ground_truth": 0}, {"key": "36083416", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9433475746682118, "ground_truth": 0}, {"key": "36083416", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9734434279773867, "ground_truth": 0}, {"key": "33839050", "model": "llama", "target_model": "llama", "recognition_score": 0.6150878525612895, "ground_truth": 1}, {"key": "33839050", "model": "llama", "target_model": "human", "recognition_score": 0.6601723750381621, "ground_truth": 0}, {"key": "33839050", "model": "llama", "target_model": "claude", "recognition_score": 0.6531269231043995, "ground_truth": 0}, {"key": "33839050", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6261242003747394, "ground_truth": 0}, {"key": "33839050", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5945512514083355, "ground_truth": 0}, {"key": "18464690", "model": "llama", "target_model": "llama", "recognition_score": 0.7431680068993818, "ground_truth": 1}, {"key": "18464690", "model": "llama", "target_model": "human", "recognition_score": 0.852935485324716, "ground_truth": 0}, {"key": "18464690", "model": "llama", "target_model": "claude", "recognition_score": 0.7416740112815849, "ground_truth": 0}, {"key": "18464690", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6076631675894484, "ground_truth": 0}, {"key": "18464690", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6424324780682931, "ground_truth": 0}, {"key": "39212665", "model": "llama", "target_model": "llama", "recognition_score": 0.3647775398892117, "ground_truth": 1}, {"key": "39212665", "model": "llama", "target_model": "human", "recognition_score": 0.3539862946512288, "ground_truth": 0}, {"key": "39212665", "model": "llama", "target_model": "claude", "recognition_score": 0.26133091381174345, "ground_truth": 0}, {"key": "39212665", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4610167908552985, "ground_truth": 0}, {"key": "39212665", "model": "llama", "target_model": "gpt35", "recognition_score": 0.23370635139699, "ground_truth": 0}, {"key": "40094011", "model": "llama", "target_model": "llama", "recognition_score": 0.7918210646304555, "ground_truth": 1}, {"key": "40094011", "model": "llama", "target_model": "human", "recognition_score": 0.8933093924497826, "ground_truth": 0}, {"key": "40094011", "model": "llama", "target_model": "claude", "recognition_score": 0.8344068906781116, "ground_truth": 0}, {"key": "40094011", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8976952894958014, "ground_truth": 0}, {"key": "40094011", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8459424395100476, "ground_truth": 0}, {"key": "36036272", "model": "llama", "target_model": "llama", "recognition_score": 0.8633916102968858, "ground_truth": 1}, {"key": "36036272", "model": "llama", "target_model": "human", "recognition_score": 0.7295197959973347, "ground_truth": 0}, {"key": "36036272", "model": "llama", "target_model": "claude", "recognition_score": 0.654894713282969, "ground_truth": 0}, {"key": "36036272", "model": "llama", "target_model": "gpt4", "recognition_score": 0.783988472821581, "ground_truth": 0}, {"key": "36036272", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7799929005175691, "ground_truth": 0}, {"key": "30681904", "model": "llama", "target_model": "llama", "recognition_score": 0.5679365747682613, "ground_truth": 1}, {"key": "30681904", "model": "llama", "target_model": "human", "recognition_score": 0.4378235178289401, "ground_truth": 0}, {"key": "30681904", "model": "llama", "target_model": "claude", "recognition_score": 0.5136684825867556, "ground_truth": 0}, {"key": "30681904", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3793783822881395, "ground_truth": 0}, {"key": "30681904", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3830641746084217, "ground_truth": 0}, {"key": "27834240", "model": "llama", "target_model": "llama", "recognition_score": 0.14033625618715512, "ground_truth": 1}, {"key": "27834240", "model": "llama", "target_model": "human", "recognition_score": 0.24798745030446412, "ground_truth": 0}, {"key": "27834240", "model": "llama", "target_model": "claude", "recognition_score": 0.21206879823740377, "ground_truth": 0}, {"key": "27834240", "model": "llama", "target_model": "gpt4", "recognition_score": 0.17667160680957353, "ground_truth": 0}, {"key": "27834240", "model": "llama", "target_model": "gpt35", "recognition_score": 0.355774882253782, "ground_truth": 0}, {"key": "35025075", "model": "llama", "target_model": "llama", "recognition_score": 0.5888891519380476, "ground_truth": 1}, {"key": "35025075", "model": "llama", "target_model": "human", "recognition_score": 0.8652240884537024, "ground_truth": 0}, {"key": "35025075", "model": "llama", "target_model": "claude", "recognition_score": 0.5350984533621335, "ground_truth": 0}, {"key": "35025075", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6926419948536305, "ground_truth": 0}, {"key": "35025075", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7138307857654541, "ground_truth": 0}, {"key": "33316985", "model": "llama", "target_model": "llama", "recognition_score": 0.956308943119163, "ground_truth": 1}, {"key": "33316985", "model": "llama", "target_model": "human", "recognition_score": 0.8824278756729984, "ground_truth": 0}, {"key": "33316985", "model": "llama", "target_model": "claude", "recognition_score": 0.9136765263866923, "ground_truth": 0}, {"key": "33316985", "model": "llama", "target_model": "gpt4", "recognition_score": 0.76908024508116, "ground_truth": 0}, {"key": "33316985", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7866228099976467, "ground_truth": 0}, {"key": "17037056", "model": "llama", "target_model": "llama", "recognition_score": 0.5156199007440997, "ground_truth": 1}, {"key": "17037056", "model": "llama", "target_model": "human", "recognition_score": 0.6757645940372267, "ground_truth": 0}, {"key": "17037056", "model": "llama", "target_model": "claude", "recognition_score": 0.665410533167406, "ground_truth": 0}, {"key": "17037056", "model": "llama", "target_model": "gpt4", "recognition_score": 0.635222420422582, "ground_truth": 0}, {"key": "17037056", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5813031058699529, "ground_truth": 0}, {"key": "34050457", "model": "llama", "target_model": "llama", "recognition_score": 0.7759445731384457, "ground_truth": 1}, {"key": "34050457", "model": "llama", "target_model": "human", "recognition_score": 0.8407826034945007, "ground_truth": 0}, {"key": "34050457", "model": "llama", "target_model": "claude", "recognition_score": 0.9178933780464978, "ground_truth": 0}, {"key": "34050457", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8175744871585388, "ground_truth": 0}, {"key": "34050457", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9173026639316773, "ground_truth": 0}, {"key": "34713745", "model": "llama", "target_model": "llama", "recognition_score": 0.4882833763638788, "ground_truth": 1}, {"key": "34713745", "model": "llama", "target_model": "human", "recognition_score": 0.47463117604572974, "ground_truth": 0}, {"key": "34713745", "model": "llama", "target_model": "claude", "recognition_score": 0.49218812648309723, "ground_truth": 0}, {"key": "34713745", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5563995975449371, "ground_truth": 0}, {"key": "34713745", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7057850285265436, "ground_truth": 0}, {"key": "40856210", "model": "llama", "target_model": "llama", "recognition_score": 0.14223188647837987, "ground_truth": 1}, {"key": "40856210", "model": "llama", "target_model": "human", "recognition_score": 0.267408175339449, "ground_truth": 0}, {"key": "40856210", "model": "llama", "target_model": "claude", "recognition_score": 0.15304214574613756, "ground_truth": 0}, {"key": "40856210", "model": "llama", "target_model": "gpt4", "recognition_score": 0.33982761870109474, "ground_truth": 0}, {"key": "40856210", "model": "llama", "target_model": "gpt35", "recognition_score": 0.1412814196138464, "ground_truth": 0}, {"key": "40848302", "model": "llama", "target_model": "llama", "recognition_score": 0.8976952915700274, "ground_truth": 1}, {"key": "40848302", "model": "llama", "target_model": "human", "recognition_score": 0.9178933698683063, "ground_truth": 0}, {"key": "40848302", "model": "llama", "target_model": "claude", "recognition_score": 0.8661325084443765, "ground_truth": 0}, {"key": "40848302", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8624675305138468, "ground_truth": 0}, {"key": "40848302", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8558511539551884, "ground_truth": 0}, {"key": "40636168", "model": "llama", "target_model": "llama", "recognition_score": 0.4167966230671516, "ground_truth": 1}, {"key": "40636168", "model": "llama", "target_model": "human", "recognition_score": 0.5292634042167925, "ground_truth": 0}, {"key": "40636168", "model": "llama", "target_model": "claude", "recognition_score": 0.640635848473417, "ground_truth": 0}, {"key": "40636168", "model": "llama", "target_model": "gpt4", "recognition_score": 0.36477756456098104, "ground_truth": 0}, {"key": "40636168", "model": "llama", "target_model": "gpt35", "recognition_score": 0.35220178732966956, "ground_truth": 0}, {"key": "34423311", "model": "llama", "target_model": "llama", "recognition_score": 0.893309408900115, "ground_truth": 1}, {"key": "34423311", "model": "llama", "target_model": "human", "recognition_score": 0.5136684920361019, "ground_truth": 0}, {"key": "34423311", "model": "llama", "target_model": "claude", "recognition_score": 0.863391604612111, "ground_truth": 0}, {"key": "34423311", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7057850301873922, "ground_truth": 0}, {"key": "34423311", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8479677615807316, "ground_truth": 0}, {"key": "34833945", "model": "llama", "target_model": "llama", "recognition_score": 0.9763105314672964, "ground_truth": 1}, {"key": "34833945", "model": "llama", "target_model": "human", "recognition_score": 0.9728307667245799, "ground_truth": 0}, {"key": "34833945", "model": "llama", "target_model": "claude", "recognition_score": 0.9838471649208703, "ground_truth": 0}, {"key": "34833945", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9883127426114011, "ground_truth": 0}, {"key": "34833945", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9863631641123607, "ground_truth": 0}, {"key": "21272328", "model": "llama", "target_model": "llama", "recognition_score": 0.19682620650912844, "ground_truth": 1}, {"key": "21272328", "model": "llama", "target_model": "human", "recognition_score": 0.685949473152583, "ground_truth": 0}, {"key": "21272328", "model": "llama", "target_model": "claude", "recognition_score": 0.4824291290053966, "ground_truth": 0}, {"key": "21272328", "model": "llama", "target_model": "gpt4", "recognition_score": 0.2583259996453516, "ground_truth": 0}, {"key": "21272328", "model": "llama", "target_model": "gpt35", "recognition_score": 0.22678362020627735, "ground_truth": 0}, {"key": "38648957", "model": "llama", "target_model": "llama", "recognition_score": 0.5058591038818854, "ground_truth": 1}, {"key": "38648957", "model": "llama", "target_model": "human", "recognition_score": 0.19930801221331726, "ground_truth": 0}, {"key": "38648957", "model": "llama", "target_model": "claude", "recognition_score": 0.36477755588297145, "ground_truth": 0}, {"key": "38648957", "model": "llama", "target_model": "gpt4", "recognition_score": 0.24364245416450409, "ground_truth": 0}, {"key": "38648957", "model": "llama", "target_model": "gpt35", "recognition_score": 0.2909808361764833, "ground_truth": 0}, {"key": "24942981", "model": "llama", "target_model": "llama", "recognition_score": 0.23934935400469248, "ground_truth": 1}, {"key": "24942981", "model": "llama", "target_model": "human", "recognition_score": 0.1699562293134844, "ground_truth": 0}, {"key": "24942981", "model": "llama", "target_model": "claude", "recognition_score": 0.26435836980849076, "ground_truth": 0}, {"key": "24942981", "model": "llama", "target_model": "gpt4", "recognition_score": 0.23510839049667515, "ground_truth": 0}, {"key": "24942981", "model": "llama", "target_model": "gpt35", "recognition_score": 0.49804686047058183, "ground_truth": 0}, {"key": "35882366", "model": "llama", "target_model": "llama", "recognition_score": 0.23231015209579725, "ground_truth": 1}, {"key": "35882366", "model": "llama", "target_model": "human", "recognition_score": 0.8068526196680668, "ground_truth": 0}, {"key": "35882366", "model": "llama", "target_model": "claude", "recognition_score": 0.21337717376678858, "ground_truth": 0}, {"key": "35882366", "model": "llama", "target_model": "gpt4", "recognition_score": 0.23370633981511357, "ground_truth": 0}, {"key": "35882366", "model": "llama", "target_model": "gpt35", "recognition_score": 0.20817893495672754, "ground_truth": 0}, {"key": "40559523", "model": "llama", "target_model": "llama", "recognition_score": 0.8459424439152943, "ground_truth": 1}, {"key": "40559523", "model": "llama", "target_model": "human", "recognition_score": 0.8864204047409623, "ground_truth": 0}, {"key": "40559523", "model": "llama", "target_model": "claude", "recognition_score": 0.800691991398146, "ground_truth": 0}, {"key": "40559523", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8244619209099479, "ground_truth": 0}, {"key": "40559523", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8175744794051154, "ground_truth": 0}, {"key": "24632722", "model": "llama", "target_model": "llama", "recognition_score": 0.7431680238927698, "ground_truth": 1}, {"key": "24632722", "model": "llama", "target_model": "human", "recognition_score": 0.4474602947100401, "ground_truth": 0}, {"key": "24632722", "model": "llama", "target_model": "claude", "recognition_score": 0.5058591079082174, "ground_truth": 0}, {"key": "24632722", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7057850391959795, "ground_truth": 0}, {"key": "24632722", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7826624676579147, "ground_truth": 0}, {"key": "36002759", "model": "llama", "target_model": "llama", "recognition_score": 0.7918210545273006, "ground_truth": 1}, {"key": "36002759", "model": "llama", "target_model": "human", "recognition_score": 0.6808786103805514, "ground_truth": 0}, {"key": "36002759", "model": "llama", "target_model": "claude", "recognition_score": 0.8670357646672681, "ground_truth": 0}, {"key": "36002759", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5273165496368671, "ground_truth": 0}, {"key": "36002759", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8376199533976523, "ground_truth": 0}, {"key": "29508534", "model": "llama", "target_model": "llama", "recognition_score": 0.899827792706457, "ground_truth": 1}, {"key": "29508534", "model": "llama", "target_model": "human", "recognition_score": 0.819893340617442, "ground_truth": 0}, {"key": "29508534", "model": "llama", "target_model": "claude", "recognition_score": 0.9099070144265684, "ground_truth": 0}, {"key": "29508534", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8539127401891312, "ground_truth": 0}, {"key": "29508534", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8864204166407097, "ground_truth": 0}, {"key": "15631612", "model": "llama", "target_model": "llama", "recognition_score": 0.9167080762915154, "ground_truth": 1}, {"key": "15631612", "model": "llama", "target_model": "human", "recognition_score": 0.8643104556093919, "ground_truth": 0}, {"key": "15631612", "model": "llama", "target_model": "claude", "recognition_score": 0.8955226780820306, "ground_truth": 0}, {"key": "15631612", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8791467639159289, "ground_truth": 0}, {"key": "15631612", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9053222957321035, "ground_truth": 0}, {"key": "40731892", "model": "llama", "target_model": "llama", "recognition_score": 0.30074556633680444, "ground_truth": 1}, {"key": "40731892", "model": "llama", "target_model": "human", "recognition_score": 0.27825679267754594, "ground_truth": 0}, {"key": "40731892", "model": "llama", "target_model": "claude", "recognition_score": 0.5563995507755486, "ground_truth": 0}, {"key": "40731892", "model": "llama", "target_model": "gpt4", "recognition_score": 0.75055276913929, "ground_truth": 0}, {"key": "40731892", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4493926701111962, "ground_truth": 0}, {"key": "35971910", "model": "llama", "target_model": "llama", "recognition_score": 0.8872045875879199, "ground_truth": 1}, {"key": "35971910", "model": "llama", "target_model": "human", "recognition_score": 0.9485372353298726, "ground_truth": 0}, {"key": "35971910", "model": "llama", "target_model": "claude", "recognition_score": 0.9136765294601111, "ground_truth": 0}, {"key": "35971910", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9511422181430877, "ground_truth": 0}, {"key": "35971910", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9019206679580986, "ground_truth": 0}, {"key": "34428424", "model": "llama", "target_model": "llama", "recognition_score": 0.9711290930064685, "ground_truth": 1}, {"key": "34428424", "model": "llama", "target_model": "human", "recognition_score": 0.9757623654172112, "ground_truth": 0}, {"key": "34428424", "model": "llama", "target_model": "claude", "recognition_score": 0.9866748518324343, "ground_truth": 0}, {"key": "34428424", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9811668734602191, "ground_truth": 0}, {"key": "34428424", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9748211604601218, "ground_truth": 0}, {"key": "36971005", "model": "llama", "target_model": "llama", "recognition_score": 0.9748211559780865, "ground_truth": 1}, {"key": "36971005", "model": "llama", "target_model": "human", "recognition_score": 0.9681411380188388, "ground_truth": 0}, {"key": "36971005", "model": "llama", "target_model": "claude", "recognition_score": 0.9817357219515913, "ground_truth": 0}, {"key": "36971005", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9412234452836155, "ground_truth": 0}, {"key": "36971005", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9575961739911754, "ground_truth": 0}, {"key": "34649067", "model": "llama", "target_model": "llama", "recognition_score": 0.3225259968188485, "ground_truth": 1}, {"key": "34649067", "model": "llama", "target_model": "human", "recognition_score": 0.1412814215443523, "ground_truth": 0}, {"key": "34649067", "model": "llama", "target_model": "claude", "recognition_score": 0.13568954131503383, "ground_truth": 0}, {"key": "34649067", "model": "llama", "target_model": "gpt4", "recognition_score": 0.2465333469059748, "ground_truth": 0}, {"key": "34649067", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3007455876846632, "ground_truth": 0}, {"key": "37355154", "model": "llama", "target_model": "llama", "recognition_score": 0.06142403856536409, "ground_truth": 1}, {"key": "37355154", "model": "llama", "target_model": "human", "recognition_score": 0.12765263219667794, "ground_truth": 0}, {"key": "37355154", "model": "llama", "target_model": "claude", "recognition_score": 0.10158944633729851, "ground_truth": 0}, {"key": "37355154", "model": "llama", "target_model": "gpt4", "recognition_score": 0.17781086471153057, "ground_truth": 0}, {"key": "37355154", "model": "llama", "target_model": "gpt35", "recognition_score": 0.1356895385359465, "ground_truth": 0}, {"key": "38674697", "model": "llama", "target_model": "llama", "recognition_score": 0.5964331643178328, "ground_truth": 1}, {"key": "38674697", "model": "llama", "target_model": "human", "recognition_score": 0.4960938248070594, "ground_truth": 0}, {"key": "38674697", "model": "llama", "target_model": "claude", "recognition_score": 0.6424324770986659, "ground_truth": 0}, {"key": "38674697", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5736784026824447, "ground_truth": 0}, {"key": "38674697", "model": "llama", "target_model": "gpt35", "recognition_score": 0.401687804347079, "ground_truth": 0}, {"key": "40525767", "model": "llama", "target_model": "llama", "recognition_score": 0.9429286048060118, "ground_truth": 1}, {"key": "40525767", "model": "llama", "target_model": "human", "recognition_score": 0.9854964192884549, "ground_truth": 0}, {"key": "40525767", "model": "llama", "target_model": "claude", "recognition_score": 0.953621792359898, "ground_truth": 0}, {"key": "40525767", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9367494789103136, "ground_truth": 0}, {"key": "40525767", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9412234423327661, "ground_truth": 0}, {"key": "27165110", "model": "llama", "target_model": "llama", "recognition_score": 0.11757213880662327, "ground_truth": 1}, {"key": "27165110", "model": "llama", "target_model": "human", "recognition_score": 0.24798743646591737, "ground_truth": 0}, {"key": "27165110", "model": "llama", "target_model": "claude", "recognition_score": 0.0913821055472864, "ground_truth": 0}, {"key": "27165110", "model": "llama", "target_model": "gpt4", "recognition_score": 0.2909808754980116, "ground_truth": 0}, {"key": "27165110", "model": "llama", "target_model": "gpt35", "recognition_score": 0.15203223224575835, "ground_truth": 0}, {"key": "35497491", "model": "llama", "target_model": "llama", "recognition_score": 0.7295197693522586, "ground_truth": 1}, {"key": "35497491", "model": "llama", "target_model": "human", "recognition_score": 0.8596637372911283, "ground_truth": 0}, {"key": "35497491", "model": "llama", "target_model": "claude", "recognition_score": 0.7577943656071884, "ground_truth": 0}, {"key": "35497491", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7106283223926557, "ground_truth": 0}, {"key": "35497491", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6740504889113357, "ground_truth": 0}, {"key": "40690716", "model": "llama", "target_model": "llama", "recognition_score": 0.8732148224783821, "ground_truth": 1}, {"key": "40690716", "model": "llama", "target_model": "human", "recognition_score": 0.9353465046756424, "ground_truth": 0}, {"key": "40690716", "model": "llama", "target_model": "claude", "recognition_score": 0.9609517111965749, "ground_truth": 0}, {"key": "40690716", "model": "llama", "target_model": "gpt4", "recognition_score": 0.938575955654796, "ground_truth": 0}, {"key": "40690716", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9433475811186074, "ground_truth": 0}, {"key": "34835193", "model": "llama", "target_model": "llama", "recognition_score": 0.95945926179229, "ground_truth": 1}, {"key": "34835193", "model": "llama", "target_model": "human", "recognition_score": 0.9572778004412411, "ground_truth": 0}, {"key": "34835193", "model": "llama", "target_model": "claude", "recognition_score": 0.969324199661421, "ground_truth": 0}, {"key": "34835193", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9566342001438878, "ground_truth": 0}, {"key": "34835193", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9546474241162345, "ground_truth": 0}, {"key": "39471712", "model": "llama", "target_model": "llama", "recognition_score": 0.7520125760336622, "ground_truth": 1}, {"key": "39471712", "model": "llama", "target_model": "human", "recognition_score": 0.6424324672231466, "ground_truth": 0}, {"key": "39471712", "model": "llama", "target_model": "claude", "recognition_score": 0.7759445667132707, "ground_truth": 0}, {"key": "39471712", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8548846272059901, "ground_truth": 0}, {"key": "39471712", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8255897216485646, "ground_truth": 0}, {"key": "39115192", "model": "llama", "target_model": "llama", "recognition_score": 0.8783142402914621, "ground_truth": 1}, {"key": "39115192", "model": "llama", "target_model": "human", "recognition_score": 0.8376199529958135, "ground_truth": 0}, {"key": "39115192", "model": "llama", "target_model": "claude", "recognition_score": 0.9092645102446523, "ground_truth": 0}, {"key": "39115192", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7138307470056179, "ground_truth": 0}, {"key": "39115192", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8661325140818149, "ground_truth": 0}, {"key": "23520673", "model": "llama", "target_model": "llama", "recognition_score": 0.29421496327164687, "ground_truth": 1}, {"key": "23520673", "model": "llama", "target_model": "human", "recognition_score": 0.478528835348811, "ground_truth": 0}, {"key": "23520673", "model": "llama", "target_model": "claude", "recognition_score": 0.605799059376214, "ground_truth": 0}, {"key": "23520673", "model": "llama", "target_model": "gpt4", "recognition_score": 0.39420094468022465, "ground_truth": 0}, {"key": "23520673", "model": "llama", "target_model": "gpt35", "recognition_score": 0.44167301086225513, "ground_truth": 0}, {"key": "35764233", "model": "llama", "target_model": "llama", "recognition_score": 0.8278281391411543, "ground_truth": 1}, {"key": "35764233", "model": "llama", "target_model": "human", "recognition_score": 0.638835268512305, "ground_truth": 0}, {"key": "35764233", "model": "llama", "target_model": "claude", "recognition_score": 0.7772998705849659, "ground_truth": 0}, {"key": "35764233", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6688802505707168, "ground_truth": 0}, {"key": "35764233", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7732163687926731, "ground_truth": 0}, {"key": "35228910", "model": "llama", "target_model": "llama", "recognition_score": 0.482429101089326, "ground_truth": 1}, {"key": "35228910", "model": "llama", "target_model": "human", "recognition_score": 0.5698526528962315, "ground_truth": 0}, {"key": "35228910", "model": "llama", "target_model": "claude", "recognition_score": 0.4687906497701413, "ground_truth": 0}, {"key": "35228910", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5312093526529409, "ground_truth": 0}, {"key": "35228910", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4707366082905186, "ground_truth": 0}, {"key": "36795599", "model": "llama", "target_model": "llama", "recognition_score": 0.9753900729219999, "ground_truth": 1}, {"key": "36795599", "model": "llama", "target_model": "human", "recognition_score": 0.9492946390865014, "ground_truth": 0}, {"key": "36795599", "model": "llama", "target_model": "claude", "recognition_score": 0.9740426438460653, "ground_truth": 0}, {"key": "36795599", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9492946329147224, "ground_truth": 0}, {"key": "36795599", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9609517052847105, "ground_truth": 0}, {"key": "38641949", "model": "llama", "target_model": "llama", "recognition_score": 0.8723473664894507, "ground_truth": 1}, {"key": "38641949", "model": "llama", "target_model": "human", "recognition_score": 0.8705972729094278, "ground_truth": 0}, {"key": "38641949", "model": "llama", "target_model": "claude", "recognition_score": 0.8354835571651177, "ground_truth": 0}, {"key": "38641949", "model": "llama", "target_model": "gpt4", "recognition_score": 0.821044107738255, "ground_truth": 0}, {"key": "38641949", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7648916211279292, "ground_truth": 0}, {"key": "29968443", "model": "llama", "target_model": "llama", "recognition_score": 0.961533809367967, "ground_truth": 1}, {"key": "29968443", "model": "llama", "target_model": "human", "recognition_score": 0.9358173536278079, "ground_truth": 0}, {"key": "29968443", "model": "llama", "target_model": "claude", "recognition_score": 0.9713473315463986, "ground_truth": 0}, {"key": "29968443", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9536217948750245, "ground_truth": 0}, {"key": "29968443", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9543079618136612, "ground_truth": 0}, {"key": "21268042", "model": "llama", "target_model": "llama", "recognition_score": 0.7813306301255459, "ground_truth": 1}, {"key": "21268042", "model": "llama", "target_model": "human", "recognition_score": 0.8714748733612424, "ground_truth": 0}, {"key": "21268042", "model": "llama", "target_model": "claude", "recognition_score": 0.7905303101992922, "ground_truth": 0}, {"key": "21268042", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9348724574482405, "ground_truth": 0}, {"key": "21268042", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8840392879420009, "ground_truth": 0}, {"key": "26808572", "model": "llama", "target_model": "llama", "recognition_score": 0.8624675490456766, "ground_truth": 1}, {"key": "26808572", "model": "llama", "target_model": "human", "recognition_score": 0.6206216377274205, "ground_truth": 0}, {"key": "26808572", "model": "llama", "target_model": "claude", "recognition_score": 0.7592254085481059, "ground_truth": 0}, {"key": "26808572", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9142907248648647, "ground_truth": 0}, {"key": "26808572", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9178933696044014, "ground_truth": 0}, {"key": "37829390", "model": "llama", "target_model": "llama", "recognition_score": 0.9005297794932767, "ground_truth": 1}, {"key": "37829390", "model": "llama", "target_model": "human", "recognition_score": 0.9390248186946879, "ground_truth": 0}, {"key": "37829390", "model": "llama", "target_model": "claude", "recognition_score": 0.9372107934917662, "ground_truth": 0}, {"key": "37829390", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9167080769200958, "ground_truth": 0}, {"key": "37829390", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8807970676652654, "ground_truth": 0}, {"key": "35716045", "model": "llama", "target_model": "llama", "recognition_score": 0.9399133504649355, "ground_truth": 1}, {"key": "35716045", "model": "llama", "target_model": "human", "recognition_score": 0.9026095956523551, "ground_truth": 0}, {"key": "35716045", "model": "llama", "target_model": "claude", "recognition_score": 0.9066531303512768, "ground_truth": 0}, {"key": "35716045", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9241418138324698, "ground_truth": 0}, {"key": "35716045", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9566342000125783, "ground_truth": 0}, {"key": "34367070", "model": "llama", "target_model": "llama", "recognition_score": 0.9142907319896791, "ground_truth": 1}, {"key": "34367070", "model": "llama", "target_model": "human", "recognition_score": 0.9429286004698765, "ground_truth": 0}, {"key": "34367070", "model": "llama", "target_model": "claude", "recognition_score": 0.8895288519615315, "ground_truth": 0}, {"key": "34367070", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9053223004556459, "ground_truth": 0}, {"key": "34367070", "model": "llama", "target_model": "gpt35", "recognition_score": 0.890294223321554, "ground_truth": 0}, {"key": "35239748", "model": "llama", "target_model": "llama", "recognition_score": 0.7786493162559742, "ground_truth": 1}, {"key": "35239748", "model": "llama", "target_model": "human", "recognition_score": 0.7592254019348367, "ground_truth": 0}, {"key": "35239748", "model": "llama", "target_model": "claude", "recognition_score": 0.7759445585550521, "ground_truth": 0}, {"key": "35239748", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6654105647843045, "ground_truth": 0}, {"key": "35239748", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8198933451801296, "ground_truth": 0}, {"key": "40421370", "model": "llama", "target_model": "llama", "recognition_score": 0.6976089493215616, "ground_truth": 1}, {"key": "40421370", "model": "llama", "target_model": "human", "recognition_score": 0.5679366204190771, "ground_truth": 0}, {"key": "40421370", "model": "llama", "target_model": "claude", "recognition_score": 0.5078118685329669, "ground_truth": 0}, {"key": "40421370", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7866228153568616, "ground_truth": 0}, {"key": "40421370", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6406358455396783, "ground_truth": 0}, {"key": "37288396", "model": "llama", "target_model": "llama", "recognition_score": 0.8311430366626262, "ground_truth": 1}, {"key": "37288396", "model": "llama", "target_model": "human", "recognition_score": 0.6959583331362038, "ground_truth": 0}, {"key": "37288396", "model": "llama", "target_model": "claude", "recognition_score": 0.8856314768129787, "ground_truth": 0}, {"key": "37288396", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7839884661458647, "ground_truth": 0}, {"key": "37288396", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8322366679886142, "ground_truth": 0}, {"key": "38903688", "model": "llama", "target_model": "llama", "recognition_score": 0.9626731114199288, "ground_truth": 1}, {"key": "38903688", "model": "llama", "target_model": "human", "recognition_score": 0.943347573090849, "ground_truth": 0}, {"key": "38903688", "model": "llama", "target_model": "claude", "recognition_score": 0.9500414817540668, "ground_truth": 0}, {"key": "38903688", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9230391547285218, "ground_truth": 0}, {"key": "38903688", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8624675239938695, "ground_truth": 0}, {"key": "28071228", "model": "llama", "target_model": "llama", "recognition_score": 0.8940517041881859, "ground_truth": 1}, {"key": "28071228", "model": "llama", "target_model": "human", "recognition_score": 0.9304582611270726, "ground_truth": 0}, {"key": "28071228", "model": "llama", "target_model": "claude", "recognition_score": 0.9458012742396188, "ground_truth": 0}, {"key": "28071228", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9376689577269701, "ground_truth": 0}, {"key": "28071228", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9591542842682408, "ground_truth": 0}, {"key": "36855834", "model": "llama", "target_model": "llama", "recognition_score": 0.7490872194122506, "ground_truth": 1}, {"key": "36855834", "model": "llama", "target_model": "human", "recognition_score": 0.7476159576391913, "ground_truth": 0}, {"key": "36855834", "model": "llama", "target_model": "claude", "recognition_score": 0.695958312465188, "ground_truth": 0}, {"key": "36855834", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8879840518637393, "ground_truth": 0}, {"key": "36855834", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7634837549761897, "ground_truth": 0}, {"key": "40548717", "model": "llama", "target_model": "llama", "recognition_score": 0.5486734780798418, "ground_truth": 1}, {"key": "40548717", "model": "llama", "target_model": "human", "recognition_score": 0.35398629570866674, "ground_truth": 0}, {"key": "40548717", "model": "llama", "target_model": "claude", "recognition_score": 0.42632156925188175, "ground_truth": 0}, {"key": "40548717", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7248702788692185, "ground_truth": 0}, {"key": "40548717", "model": "llama", "target_model": "gpt35", "recognition_score": 0.44167299266668286, "ground_truth": 0}, {"key": "37051175", "model": "llama", "target_model": "llama", "recognition_score": 0.8991213750027262, "ground_truth": 1}, {"key": "37051175", "model": "llama", "target_model": "human", "recognition_score": 0.8962513647531378, "ground_truth": 0}, {"key": "37051175", "model": "llama", "target_model": "claude", "recognition_score": 0.7371581742465116, "ground_truth": 0}, {"key": "37051175", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8962513756907354, "ground_truth": 0}, {"key": "37051175", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9358173568713679, "ground_truth": 0}, {"key": "38882119", "model": "llama", "target_model": "llama", "recognition_score": 0.8807970769558298, "ground_truth": 1}, {"key": "38882119", "model": "llama", "target_model": "human", "recognition_score": 0.7264256196381713, "ground_truth": 0}, {"key": "38882119", "model": "llama", "target_model": "claude", "recognition_score": 0.9235923096850505, "ground_truth": 0}, {"key": "38882119", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9722043773929354, "ground_truth": 0}, {"key": "38882119", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8568123078718307, "ground_truth": 0}, {"key": "19485402", "model": "llama", "target_model": "llama", "recognition_score": 0.8128673204429098, "ground_truth": 1}, {"key": "19485402", "model": "llama", "target_model": "human", "recognition_score": 0.8705972691813567, "ground_truth": 0}, {"key": "19485402", "model": "llama", "target_model": "claude", "recognition_score": 0.8407826107494603, "ground_truth": 0}, {"key": "19485402", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8152324917683664, "ground_truth": 0}, {"key": "19485402", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6113819755831718, "ground_truth": 0}, {"key": "36060907", "model": "llama", "target_model": "llama", "recognition_score": 0.6297746147036908, "ground_truth": 1}, {"key": "36060907", "model": "llama", "target_model": "human", "recognition_score": 0.6757646123649761, "ground_truth": 0}, {"key": "36060907", "model": "llama", "target_model": "claude", "recognition_score": 0.5698526691324262, "ground_truth": 0}, {"key": "36060907", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6076631671840704, "ground_truth": 0}, {"key": "36060907", "model": "llama", "target_model": "gpt35", "recognition_score": 0.695958320425324, "ground_truth": 0}, {"key": "24037309", "model": "llama", "target_model": "llama", "recognition_score": 0.7490872163506102, "ground_truth": 1}, {"key": "24037309", "model": "llama", "target_model": "human", "recognition_score": 0.9278877980814548, "ground_truth": 0}, {"key": "24037309", "model": "llama", "target_model": "claude", "recognition_score": 0.8397339632008867, "ground_truth": 0}, {"key": "24037309", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8705972724211194, "ground_truth": 0}, {"key": "24037309", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7879311945882393, "ground_truth": 0}, {"key": "35605805", "model": "llama", "target_model": "llama", "recognition_score": 0.8104789042380148, "ground_truth": 1}, {"key": "35605805", "model": "llama", "target_model": "human", "recognition_score": 0.8697145769267108, "ground_truth": 0}, {"key": "35605805", "model": "llama", "target_model": "claude", "recognition_score": 0.7264256057551126, "ground_truth": 0}, {"key": "35605805", "model": "llama", "target_model": "gpt4", "recognition_score": 0.837619944250506, "ground_truth": 0}, {"key": "35605805", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8548846312581946, "ground_truth": 0}, {"key": "17706248", "model": "llama", "target_model": "llama", "recognition_score": 0.5869963986291036, "ground_truth": 1}, {"key": "17706248", "model": "llama", "target_model": "human", "recognition_score": 0.5273165037882496, "ground_truth": 0}, {"key": "17706248", "model": "llama", "target_model": "claude", "recognition_score": 0.5907791816424481, "ground_truth": 0}, {"key": "17706248", "model": "llama", "target_model": "gpt4", "recognition_score": 0.503906152543002, "ground_truth": 0}, {"key": "17706248", "model": "llama", "target_model": "gpt35", "recognition_score": 0.49218812841491233, "ground_truth": 0}, {"key": "36883559", "model": "llama", "target_model": "llama", "recognition_score": 0.9399133531090584, "ground_truth": 1}, {"key": "36883559", "model": "llama", "target_model": "human", "recognition_score": 0.7732163952828344, "ground_truth": 0}, {"key": "36883559", "model": "llama", "target_model": "claude", "recognition_score": 0.7386690817210636, "ground_truth": 0}, {"key": "36883559", "model": "llama", "target_model": "gpt4", "recognition_score": 0.864310443975662, "ground_truth": 0}, {"key": "36883559", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8749346101378682, "ground_truth": 0}, {"key": "32799471", "model": "llama", "target_model": "llama", "recognition_score": 0.8848377673441228, "ground_truth": 1}, {"key": "32799471", "model": "llama", "target_model": "human", "recognition_score": 0.8910549436041442, "ground_truth": 0}, {"key": "32799471", "model": "llama", "target_model": "claude", "recognition_score": 0.8633916130609077, "ground_truth": 0}, {"key": "32799471", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8918110468969886, "ground_truth": 0}, {"key": "32799471", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8152324868147253, "ground_truth": 0}, {"key": "34797243", "model": "llama", "target_model": "llama", "recognition_score": 0.4148988218239339, "ground_truth": 1}, {"key": "34797243", "model": "llama", "target_model": "human", "recognition_score": 0.6723317169988348, "ground_truth": 0}, {"key": "34797243", "model": "llama", "target_model": "claude", "recognition_score": 0.8365545658666481, "ground_truth": 0}, {"key": "34797243", "model": "llama", "target_model": "gpt4", "recognition_score": 0.712232156647946, "ground_truth": 0}, {"key": "34797243", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6442251247811928, "ground_truth": 0}, {"key": "32154876", "model": "llama", "target_model": "llama", "recognition_score": 0.1943678195439926, "ground_truth": 1}, {"key": "32154876", "model": "llama", "target_model": "human", "recognition_score": 0.4301473454265195, "ground_truth": 0}, {"key": "32154876", "model": "llama", "target_model": "claude", "recognition_score": 0.43974733631776886, "ground_truth": 0}, {"key": "32154876", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3293917276384098, "ground_truth": 0}, {"key": "32154876", "model": "llama", "target_model": "gpt35", "recognition_score": 0.19314736979758995, "ground_truth": 0}, {"key": "37962274", "model": "llama", "target_model": "llama", "recognition_score": 0.8791467732733548, "ground_truth": 1}, {"key": "37962274", "model": "llama", "target_model": "human", "recognition_score": 0.836554557041953, "ground_truth": 0}, {"key": "37962274", "model": "llama", "target_model": "claude", "recognition_score": 0.8198933507570354, "ground_truth": 0}, {"key": "37962274", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7138307481418243, "ground_truth": 0}, {"key": "37962274", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7956580839768018, "ground_truth": 0}, {"key": "35574030", "model": "llama", "target_model": "llama", "recognition_score": 0.7662936440103078, "ground_truth": 1}, {"key": "35574030", "model": "llama", "target_model": "human", "recognition_score": 0.8902942192344534, "ground_truth": 0}, {"key": "35574030", "model": "llama", "target_model": "claude", "recognition_score": 0.8697145917947201, "ground_truth": 0}, {"key": "35574030", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8940517024719696, "ground_truth": 0}, {"key": "35574030", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8558511376187645, "ground_truth": 0}, {"key": "39105949", "model": "llama", "target_model": "llama", "recognition_score": 0.5717665888558622, "ground_truth": 1}, {"key": "39105949", "model": "llama", "target_model": "human", "recognition_score": 0.8056321912404228, "ground_truth": 0}, {"key": "39105949", "model": "llama", "target_model": "claude", "recognition_score": 0.8376199757032523, "ground_truth": 0}, {"key": "39105949", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8164063674508808, "ground_truth": 0}, {"key": "39105949", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8489721949007529, "ground_truth": 0}, {"key": "41064322", "model": "llama", "target_model": "llama", "recognition_score": 0.9671630441222514, "ground_truth": 1}, {"key": "41064322", "model": "llama", "target_model": "human", "recognition_score": 0.9850429129347889, "ground_truth": 0}, {"key": "41064322", "model": "llama", "target_model": "claude", "recognition_score": 0.9840936083987667, "ground_truth": 0}, {"key": "41064322", "model": "llama", "target_model": "gpt4", "recognition_score": 0.980580651713764, "ground_truth": 0}, {"key": "41064322", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9787126470755837, "ground_truth": 0}, {"key": "28105101", "model": "llama", "target_model": "llama", "recognition_score": 0.8969755772772612, "ground_truth": 1}, {"key": "28105101", "model": "llama", "target_model": "human", "recognition_score": 0.8947894656826101, "ground_truth": 0}, {"key": "28105101", "model": "llama", "target_model": "claude", "recognition_score": 0.838679758067397, "ground_truth": 0}, {"key": "28105101", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8386797643115559, "ground_truth": 0}, {"key": "28105101", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8732148362324119, "ground_truth": 0}, {"key": "36036068", "model": "llama", "target_model": "llama", "recognition_score": 0.8210441084301564, "ground_truth": 1}, {"key": "36036068", "model": "llama", "target_model": "human", "recognition_score": 0.8643104536587126, "ground_truth": 0}, {"key": "36036068", "model": "llama", "target_model": "claude", "recognition_score": 0.8489721845931215, "ground_truth": 0}, {"key": "36036068", "model": "llama", "target_model": "gpt4", "recognition_score": 0.852935475683242, "ground_truth": 0}, {"key": "36036068", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8187367756779087, "ground_truth": 0}, {"key": "37991460", "model": "llama", "target_model": "llama", "recognition_score": 0.8438950964922568, "ground_truth": 1}, {"key": "37991460", "model": "llama", "target_model": "human", "recognition_score": 0.9252299633013145, "ground_truth": 0}, {"key": "37991460", "model": "llama", "target_model": "claude", "recognition_score": 0.8244619267702026, "ground_truth": 0}, {"key": "37991460", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7634837640785233, "ground_truth": 0}, {"key": "37991460", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8548846325563155, "ground_truth": 0}, {"key": "38437830", "model": "llama", "target_model": "llama", "recognition_score": 0.7956581145483419, "ground_truth": 1}, {"key": "38437830", "model": "llama", "target_model": "human", "recognition_score": 0.7772998537592039, "ground_truth": 0}, {"key": "38437830", "model": "llama", "target_model": "claude", "recognition_score": 0.9252299554650405, "ground_truth": 0}, {"key": "38437830", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7956581108543929, "ground_truth": 0}, {"key": "38437830", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8140528222907307, "ground_truth": 0}, {"key": "36507138", "model": "llama", "target_model": "llama", "recognition_score": 0.7577943772548036, "ground_truth": 1}, {"key": "36507138", "model": "llama", "target_model": "human", "recognition_score": 0.533154383268932, "ground_truth": 0}, {"key": "36507138", "model": "llama", "target_model": "claude", "recognition_score": 0.67917869344138, "ground_truth": 0}, {"key": "36507138", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8519528018067919, "ground_truth": 0}, {"key": "36507138", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7295197826047303, "ground_truth": 0}, {"key": "37824866", "model": "llama", "target_model": "llama", "recognition_score": 0.8418256451650904, "ground_truth": 1}, {"key": "37824866", "model": "llama", "target_model": "human", "recognition_score": 0.9155072441098825, "ground_truth": 0}, {"key": "37824866", "model": "llama", "target_model": "claude", "recognition_score": 0.8428631569955368, "ground_truth": 0}, {"key": "37824866", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7799929043771555, "ground_truth": 0}, {"key": "37824866", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7772998794562116, "ground_truth": 0}, {"key": "25088134", "model": "llama", "target_model": "llama", "recognition_score": 0.7025300627531427, "ground_truth": 1}, {"key": "25088134", "model": "llama", "target_model": "human", "recognition_score": 0.8255897432330215, "ground_truth": 0}, {"key": "25088134", "model": "llama", "target_model": "claude", "recognition_score": 0.6636689356179835, "ground_truth": 0}, {"key": "25088134", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5717666314863615, "ground_truth": 0}, {"key": "25088134", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8116760353767163, "ground_truth": 0}, {"key": "40172531", "model": "llama", "target_model": "llama", "recognition_score": 0.8902942134613028, "ground_truth": 1}, {"key": "40172531", "model": "llama", "target_model": "human", "recognition_score": 0.9012274206775112, "ground_truth": 0}, {"key": "40172531", "model": "llama", "target_model": "claude", "recognition_score": 0.8624675153425856, "ground_truth": 0}, {"key": "40172531", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8732148169145134, "ground_truth": 0}, {"key": "40172531", "model": "llama", "target_model": "gpt35", "recognition_score": 0.839733986192522, "ground_truth": 0}, {"key": "37035874", "model": "llama", "target_model": "llama", "recognition_score": 0.4590761389073143, "ground_truth": 1}, {"key": "37035874", "model": "llama", "target_model": "human", "recognition_score": 0.36840570774500203, "ground_truth": 0}, {"key": "37035874", "model": "llama", "target_model": "claude", "recognition_score": 0.5312093555802393, "ground_truth": 0}, {"key": "37035874", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4416729881807374, "ground_truth": 0}, {"key": "37035874", "model": "llama", "target_model": "gpt35", "recognition_score": 0.36840569398270373, "ground_truth": 0}, {"key": "36404465", "model": "llama", "target_model": "llama", "recognition_score": 0.9886682451929757, "ground_truth": 1}, {"key": "36404465", "model": "llama", "target_model": "human", "recognition_score": 0.9954967276856354, "ground_truth": 0}, {"key": "36404465", "model": "llama", "target_model": "claude", "recognition_score": 0.9895109093990518, "ground_truth": 0}, {"key": "36404465", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9914886964557675, "ground_truth": 0}, {"key": "36404465", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9886682481971479, "ground_truth": 0}, {"key": "39602052", "model": "llama", "target_model": "llama", "recognition_score": 0.9235923102644661, "ground_truth": 1}, {"key": "39602052", "model": "llama", "target_model": "human", "recognition_score": 0.9309620650138503, "ground_truth": 0}, {"key": "39602052", "model": "llama", "target_model": "claude", "recognition_score": 0.9394706101952038, "ground_truth": 0}, {"key": "39602052", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9407897462177952, "ground_truth": 0}, {"key": "39602052", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9399133483078485, "ground_truth": 0}, {"key": "33792789", "model": "llama", "target_model": "llama", "recognition_score": 0.8221891369994088, "ground_truth": 1}, {"key": "33792789", "model": "llama", "target_model": "human", "recognition_score": 0.5755880122959264, "ground_truth": 0}, {"key": "33792789", "model": "llama", "target_model": "claude", "recognition_score": 0.8365545504945403, "ground_truth": 0}, {"key": "33792789", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7943849612758582, "ground_truth": 0}, {"key": "33792789", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8418256450980508, "ground_truth": 0}, {"key": "32776626", "model": "llama", "target_model": "llama", "recognition_score": 0.7943849755383683, "ground_truth": 1}, {"key": "32776626", "model": "llama", "target_model": "human", "recognition_score": 0.7217432153828836, "ground_truth": 0}, {"key": "32776626", "model": "llama", "target_model": "claude", "recognition_score": 0.6531269178276868, "ground_truth": 0}, {"key": "32776626", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5078118705160399, "ground_truth": 0}, {"key": "32776626", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7185944202876987, "ground_truth": 0}, {"key": "37195090", "model": "llama", "target_model": "llama", "recognition_score": 0.6442251110613473, "ground_truth": 1}, {"key": "37195090", "model": "llama", "target_model": "human", "recognition_score": 0.8128673169683251, "ground_truth": 0}, {"key": "37195090", "model": "llama", "target_model": "claude", "recognition_score": 0.8278281577886912, "ground_truth": 0}, {"key": "37195090", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8267117777916458, "ground_truth": 0}, {"key": "37195090", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6791787178669021, "ground_truth": 0}, {"key": "33981824", "model": "llama", "target_model": "llama", "recognition_score": 0.2751297379752866, "ground_truth": 1}, {"key": "33981824", "model": "llama", "target_model": "human", "recognition_score": 0.24944723212823067, "ground_truth": 0}, {"key": "33981824", "model": "llama", "target_model": "claude", "recognition_score": 0.47657966524088907, "ground_truth": 0}, {"key": "33981824", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3998116445323304, "ground_truth": 0}, {"key": "33981824", "model": "llama", "target_model": "gpt35", "recognition_score": 0.203074632076208, "ground_truth": 0}, {"key": "39569142", "model": "llama", "target_model": "llama", "recognition_score": 0.5019531343901581, "ground_truth": 1}, {"key": "39569142", "model": "llama", "target_model": "human", "recognition_score": 0.7106283121608654, "ground_truth": 0}, {"key": "39569142", "model": "llama", "target_model": "claude", "recognition_score": 0.4785288247037731, "ground_truth": 0}, {"key": "39569142", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5195213135641711, "ground_truth": 0}, {"key": "39569142", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4111108407931101, "ground_truth": 0}, {"key": "40268210", "model": "llama", "target_model": "llama", "recognition_score": 0.9437636564053933, "ground_truth": 1}, {"key": "40268210", "model": "llama", "target_model": "human", "recognition_score": 0.7662936484203916, "ground_truth": 0}, {"key": "40268210", "model": "llama", "target_model": "claude", "recognition_score": 0.8933094157349225, "ground_truth": 0}, {"key": "40268210", "model": "llama", "target_model": "gpt4", "recognition_score": 0.96006268968804, "ground_truth": 0}, {"key": "40268210", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9079671399467566, "ground_truth": 0}, {"key": "34925159", "model": "llama", "target_model": "llama", "recognition_score": 0.9504109739073663, "ground_truth": 1}, {"key": "34925159", "model": "llama", "target_model": "human", "recognition_score": 0.6976089146216239, "ground_truth": 0}, {"key": "34925159", "model": "llama", "target_model": "claude", "recognition_score": 0.8633916046124742, "ground_truth": 0}, {"key": "34925159", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9385759611058359, "ground_truth": 0}, {"key": "34925159", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9425067233769326, "ground_truth": 0}, {"key": "36181903", "model": "llama", "target_model": "llama", "recognition_score": 0.9683812340838096, "ground_truth": 1}, {"key": "36181903", "model": "llama", "target_model": "human", "recognition_score": 0.9815951095037803, "ground_truth": 0}, {"key": "36181903", "model": "llama", "target_model": "claude", "recognition_score": 0.9832145093707942, "ground_truth": 0}, {"key": "36181903", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9746286892833146, "ground_truth": 0}, {"key": "36181903", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9813106933104817, "ground_truth": 0}, {"key": "38620559", "model": "llama", "target_model": "llama", "recognition_score": 0.9420819137466517, "ground_truth": 1}, {"key": "38620559", "model": "llama", "target_model": "human", "recognition_score": 0.9412234427665298, "ground_truth": 0}, {"key": "38620559", "model": "llama", "target_model": "claude", "recognition_score": 0.9224823511206337, "ground_truth": 0}, {"key": "38620559", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9835969672657605, "ground_truth": 0}, {"key": "38620559", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9768465853915185, "ground_truth": 0}, {"key": "32719657", "model": "llama", "target_model": "llama", "recognition_score": 0.6584175005932872, "ground_truth": 1}, {"key": "32719657", "model": "llama", "target_model": "human", "recognition_score": 0.9314625066825407, "ground_truth": 0}, {"key": "32719657", "model": "llama", "target_model": "claude", "recognition_score": 0.7356416352047543, "ground_truth": 0}, {"key": "32719657", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7310585734164208, "ground_truth": 0}, {"key": "32719657", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6636689488054055, "ground_truth": 0}, {"key": "37530914", "model": "llama", "target_model": "llama", "recognition_score": 0.562176516935577, "ground_truth": 1}, {"key": "37530914", "model": "llama", "target_model": "human", "recognition_score": 0.656658265792485, "ground_truth": 0}, {"key": "37530914", "model": "llama", "target_model": "claude", "recognition_score": 0.7577943748037785, "ground_truth": 0}, {"key": "37530914", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8092759906054616, "ground_truth": 0}, {"key": "37530914", "model": "llama", "target_model": "gpt35", "recognition_score": 0.42823339165231533, "ground_truth": 0}, {"key": "33306933", "model": "llama", "target_model": "llama", "recognition_score": 0.8749346280593837, "ground_truth": 1}, {"key": "33306933", "model": "llama", "target_model": "human", "recognition_score": 0.9481545305629389, "ground_truth": 0}, {"key": "33306933", "model": "llama", "target_model": "claude", "recognition_score": 0.9609517057068786, "ground_truth": 0}, {"key": "33306933", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8661325143785286, "ground_truth": 0}, {"key": "33306933", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9136765275365686, "ground_truth": 0}, {"key": "33837212", "model": "llama", "target_model": "llama", "recognition_score": 0.8365545690855365, "ground_truth": 1}, {"key": "33837212", "model": "llama", "target_model": "human", "recognition_score": 0.8221891382336007, "ground_truth": 0}, {"key": "33837212", "model": "llama", "target_model": "claude", "recognition_score": 0.8918110396520892, "ground_truth": 0}, {"key": "33837212", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8925625247960844, "ground_truth": 0}, {"key": "33837212", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8652240869418669, "ground_truth": 0}, {"key": "40945179", "model": "llama", "target_model": "llama", "recognition_score": 0.7732163789592187, "ground_truth": 1}, {"key": "40945179", "model": "llama", "target_model": "human", "recognition_score": 0.6370307859455798, "ground_truth": 0}, {"key": "40945179", "model": "llama", "target_model": "claude", "recognition_score": 0.9155072470419993, "ground_truth": 0}, {"key": "40945179", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7505527650947238, "ground_truth": 0}, {"key": "40945179", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7341195317554742, "ground_truth": 0}, {"key": "34152358", "model": "llama", "target_model": "llama", "recognition_score": 0.43590151415467093, "ground_truth": 1}, {"key": "34152358", "model": "llama", "target_model": "human", "recognition_score": 0.7025300386933314, "ground_truth": 0}, {"key": "34152358", "model": "llama", "target_model": "claude", "recognition_score": 0.7905303213217126, "ground_truth": 0}, {"key": "34152358", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6132365430358558, "ground_truth": 0}, {"key": "34152358", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6566582630554607, "ground_truth": 0}, {"key": "34136541", "model": "llama", "target_model": "llama", "recognition_score": 0.9612438063757809, "ground_truth": 1}, {"key": "34136541", "model": "llama", "target_model": "human", "recognition_score": 0.9213576216121654, "ground_truth": 0}, {"key": "34136541", "model": "llama", "target_model": "claude", "recognition_score": 0.9462003557326193, "ground_truth": 0}, {"key": "34136541", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9263037270730531, "ground_truth": 0}, {"key": "34136541", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8652240838391813, "ground_truth": 0}, {"key": "37469603", "model": "llama", "target_model": "llama", "recognition_score": 0.7356416350152718, "ground_truth": 1}, {"key": "37469603", "model": "llama", "target_model": "human", "recognition_score": 0.8976953023832357, "ground_truth": 0}, {"key": "37469603", "model": "llama", "target_model": "claude", "recognition_score": 0.8955226752708195, "ground_truth": 0}, {"key": "37469603", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8624675222177159, "ground_truth": 0}, {"key": "37469603", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9053223002324541, "ground_truth": 0}, {"key": "37353611", "model": "llama", "target_model": "llama", "recognition_score": 0.982423117046509, "ground_truth": 1}, {"key": "37353611", "model": "llama", "target_model": "human", "recognition_score": 0.942081910504173, "ground_truth": 0}, {"key": "37353611", "model": "llama", "target_model": "claude", "recognition_score": 0.9441768630186393, "ground_truth": 0}, {"key": "37353611", "model": "llama", "target_model": "gpt4", "recognition_score": 0.959762058843505, "ground_truth": 0}, {"key": "37353611", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9525741296350116, "ground_truth": 0}, {"key": "37211649", "model": "llama", "target_model": "llama", "recognition_score": 0.6132365353743594, "ground_truth": 1}, {"key": "37211649", "model": "llama", "target_model": "human", "recognition_score": 0.9111797003560895, "ground_truth": 0}, {"key": "37211649", "model": "llama", "target_model": "claude", "recognition_score": 0.8848377625693854, "ground_truth": 0}, {"key": "37211649", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8175744670422114, "ground_truth": 0}, {"key": "37211649", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7943849536450454, "ground_truth": 0}, {"key": "37320976", "model": "llama", "target_model": "llama", "recognition_score": 0.8418256331784558, "ground_truth": 1}, {"key": "37320976", "model": "llama", "target_model": "human", "recognition_score": 0.8705972773332168, "ground_truth": 0}, {"key": "37320976", "model": "llama", "target_model": "claude", "recognition_score": 0.8918110463498401, "ground_truth": 0}, {"key": "37320976", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8322366548893482, "ground_truth": 0}, {"key": "37320976", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8705972546612617, "ground_truth": 0}, {"key": "34492412", "model": "llama", "target_model": "llama", "recognition_score": 0.9711290930467341, "ground_truth": 1}, {"key": "34492412", "model": "llama", "target_model": "human", "recognition_score": 0.7826624813441851, "ground_truth": 0}, {"key": "34492412", "model": "llama", "target_model": "claude", "recognition_score": 0.9911526453153442, "ground_truth": 0}, {"key": "34492412", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9500414768186106, "ground_truth": 0}, {"key": "34492412", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9563089398884753, "ground_truth": 0}, {"key": "36655016", "model": "llama", "target_model": "llama", "recognition_score": 0.9750122065016129, "ground_truth": 1}, {"key": "36655016", "model": "llama", "target_model": "human", "recognition_score": 0.9759464469794369, "ground_truth": 0}, {"key": "36655016", "model": "llama", "target_model": "claude", "recognition_score": 0.9798226815777853, "ground_truth": 0}, {"key": "36655016", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9732407186905642, "ground_truth": 0}, {"key": "36655016", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9618217205008337, "ground_truth": 0}, {"key": "35220773", "model": "llama", "target_model": "llama", "recognition_score": 0.7759445447799671, "ground_truth": 1}, {"key": "35220773", "model": "llama", "target_model": "human", "recognition_score": 0.8969755715996552, "ground_truth": 0}, {"key": "35220773", "model": "llama", "target_model": "claude", "recognition_score": 0.8872045965372104, "ground_truth": 0}, {"key": "35220773", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8705972791875911, "ground_truth": 0}, {"key": "35220773", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8344068902793023, "ground_truth": 0}, {"key": "31569808", "model": "llama", "target_model": "llama", "recognition_score": 0.7248702906981538, "ground_truth": 1}, {"key": "31569808", "model": "llama", "target_model": "human", "recognition_score": 0.6424324758450921, "ground_truth": 0}, {"key": "31569808", "model": "llama", "target_model": "claude", "recognition_score": 0.6261241882358259, "ground_truth": 0}, {"key": "31569808", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6859494523874133, "ground_truth": 0}, {"key": "31569808", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7956580986775796, "ground_truth": 0}, {"key": "37696256", "model": "llama", "target_model": "llama", "recognition_score": 0.7185943891218305, "ground_truth": 1}, {"key": "37696256", "model": "llama", "target_model": "human", "recognition_score": 0.7592253905909698, "ground_truth": 0}, {"key": "37696256", "model": "llama", "target_model": "claude", "recognition_score": 0.5409238798888362, "ground_truth": 0}, {"key": "37696256", "model": "llama", "target_model": "gpt4", "recognition_score": 0.717011871201988, "ground_truth": 0}, {"key": "37696256", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7057850253334375, "ground_truth": 0}, {"key": "36874328", "model": "llama", "target_model": "llama", "recognition_score": 0.8791467601943418, "ground_truth": 1}, {"key": "36874328", "model": "llama", "target_model": "human", "recognition_score": 0.9536217928004413, "ground_truth": 0}, {"key": "36874328", "model": "llama", "target_model": "claude", "recognition_score": 0.9202179887189036, "ground_truth": 0}, {"key": "36874328", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9246876932288868, "ground_truth": 0}, {"key": "36874328", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9416541580470333, "ground_truth": 0}, {"key": "24532377", "model": "llama", "target_model": "llama", "recognition_score": 0.35042140697214286, "ground_truth": 1}, {"key": "24532377", "model": "llama", "target_model": "human", "recognition_score": 0.4205995832222709, "ground_truth": 0}, {"key": "24532377", "model": "llama", "target_model": "claude", "recognition_score": 0.3415825173857032, "ground_truth": 0}, {"key": "24532377", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4902356280831115, "ground_truth": 0}, {"key": "24532377", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3775407019513966, "ground_truth": 0}, {"key": "39560618", "model": "llama", "target_model": "llama", "recognition_score": 0.8568122974177762, "ground_truth": 1}, {"key": "39560618", "model": "llama", "target_model": "human", "recognition_score": 0.7956581169722586, "ground_truth": 0}, {"key": "39560618", "model": "llama", "target_model": "claude", "recognition_score": 0.8221891419390484, "ground_truth": 0}, {"key": "39560618", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8438950910722178, "ground_truth": 0}, {"key": "39560618", "model": "llama", "target_model": "gpt35", "recognition_score": 0.895522672989986, "ground_truth": 0}, {"key": "34922693", "model": "llama", "target_model": "llama", "recognition_score": 0.13846179656358296, "ground_truth": 1}, {"key": "34922693", "model": "llama", "target_model": "human", "recognition_score": 0.23651622480986212, "ground_truth": 0}, {"key": "34922693", "model": "llama", "target_model": "claude", "recognition_score": 0.41111088881537966, "ground_truth": 0}, {"key": "34922693", "model": "llama", "target_model": "gpt4", "recognition_score": 0.37387580405612636, "ground_truth": 0}, {"key": "34922693", "model": "llama", "target_model": "gpt35", "recognition_score": 0.31237000145273774, "ground_truth": 0}, {"key": "33629577", "model": "llama", "target_model": "llama", "recognition_score": 0.478528829946923, "ground_truth": 1}, {"key": "33629577", "model": "llama", "target_model": "human", "recognition_score": 0.5409238794767839, "ground_truth": 0}, {"key": "33629577", "model": "llama", "target_model": "claude", "recognition_score": 0.5175709052550201, "ground_truth": 0}, {"key": "33629577", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5136684682873933, "ground_truth": 0}, {"key": "33629577", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6113819390037795, "ground_truth": 0}, {"key": "32284359", "model": "llama", "target_model": "llama", "recognition_score": 0.6842640365534993, "ground_truth": 1}, {"key": "32284359", "model": "llama", "target_model": "human", "recognition_score": 0.5717666039933293, "ground_truth": 0}, {"key": "32284359", "model": "llama", "target_model": "claude", "recognition_score": 0.7853085808671914, "ground_truth": 0}, {"key": "32284359", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7905303231099489, "ground_truth": 0}, {"key": "32284359", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8670357652306974, "ground_truth": 0}, {"key": "28082962", "model": "llama", "target_model": "llama", "recognition_score": 0.5755879868132388, "ground_truth": 1}, {"key": "28082962", "model": "llama", "target_model": "human", "recognition_score": 0.5736784161365446, "ground_truth": 0}, {"key": "28082962", "model": "llama", "target_model": "claude", "recognition_score": 0.7704647932230112, "ground_truth": 0}, {"key": "28082962", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6791787133763134, "ground_truth": 0}, {"key": "28082962", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5331543933062554, "ground_truth": 0}, {"key": "24796803", "model": "llama", "target_model": "llama", "recognition_score": 0.8104789072174481, "ground_truth": 1}, {"key": "24796803", "model": "llama", "target_model": "human", "recognition_score": 0.7074047009064525, "ground_truth": 0}, {"key": "24796803", "model": "llama", "target_model": "claude", "recognition_score": 0.6279512159146385, "ground_truth": 0}, {"key": "24796803", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7759445336277548, "ground_truth": 0}, {"key": "24796803", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8832359829849848, "ground_truth": 0}, {"key": "35466150", "model": "llama", "target_model": "llama", "recognition_score": 0.7799929167543196, "ground_truth": 1}, {"key": "35466150", "model": "llama", "target_model": "human", "recognition_score": 0.7956581101471868, "ground_truth": 0}, {"key": "35466150", "model": "llama", "target_model": "claude", "recognition_score": 0.8910549519759635, "ground_truth": 0}, {"key": "35466150", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8449215237375071, "ground_truth": 0}, {"key": "35466150", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8848377730357957, "ground_truth": 0}, {"key": "35754289", "model": "llama", "target_model": "llama", "recognition_score": 0.9425067165881731, "ground_truth": 1}, {"key": "35754289", "model": "llama", "target_model": "human", "recognition_score": 0.939470605075428, "ground_truth": 0}, {"key": "35754289", "model": "llama", "target_model": "claude", "recognition_score": 0.9385759615697141, "ground_truth": 0}, {"key": "35754289", "model": "llama", "target_model": "gpt4", "recognition_score": 0.913676524751005, "ground_truth": 0}, {"key": "35754289", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9190632901271159, "ground_truth": 0}, {"key": "36678662", "model": "llama", "target_model": "llama", "recognition_score": 0.9858276353105662, "ground_truth": 1}, {"key": "36678662", "model": "llama", "target_model": "human", "recognition_score": 0.9837225396725843, "ground_truth": 0}, {"key": "36678662", "model": "llama", "target_model": "claude", "recognition_score": 0.929440404327594, "ground_truth": 0}, {"key": "36678662", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9489172610318208, "ground_truth": 0}, {"key": "36678662", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9653811602647201, "ground_truth": 0}, {"key": "35399671", "model": "llama", "target_model": "llama", "recognition_score": 0.9543079673789842, "ground_truth": 1}, {"key": "35399671", "model": "llama", "target_model": "human", "recognition_score": 0.9196425357069656, "ground_truth": 0}, {"key": "35399671", "model": "llama", "target_model": "claude", "recognition_score": 0.9489172660439059, "ground_truth": 0}, {"key": "35399671", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9481545315217283, "ground_truth": 0}, {"key": "35399671", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9196425399277506, "ground_truth": 0}, {"key": "36888180", "model": "llama", "target_model": "llama", "recognition_score": 0.8164063696584565, "ground_truth": 1}, {"key": "36888180", "model": "llama", "target_model": "human", "recognition_score": 0.8365545678443359, "ground_truth": 0}, {"key": "36888180", "model": "llama", "target_model": "claude", "recognition_score": 0.8568122878072895, "ground_truth": 0}, {"key": "36888180", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8679338476746171, "ground_truth": 0}, {"key": "36888180", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9005297974033183, "ground_truth": 0}, {"key": "28061069", "model": "llama", "target_model": "llama", "recognition_score": 0.46295864056686764, "ground_truth": 1}, {"key": "28061069", "model": "llama", "target_model": "human", "recognition_score": 0.6876300076574636, "ground_truth": 0}, {"key": "28061069", "model": "llama", "target_model": "claude", "recognition_score": 0.6315943099897723, "ground_truth": 0}, {"key": "28061069", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6654105734214862, "ground_truth": 0}, {"key": "28061069", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4746311927889275, "ground_truth": 0}, {"key": "22259982", "model": "llama", "target_model": "llama", "recognition_score": 0.5486734837712339, "ground_truth": 1}, {"key": "22259982", "model": "llama", "target_model": "human", "recognition_score": 0.6723316907702553, "ground_truth": 0}, {"key": "22259982", "model": "llama", "target_model": "claude", "recognition_score": 0.6654105423724179, "ground_truth": 0}, {"key": "22259982", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7563575464919786, "ground_truth": 0}, {"key": "22259982", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5755879901422124, "ground_truth": 0}, {"key": "34026805", "model": "llama", "target_model": "llama", "recognition_score": 0.8848377737724546, "ground_truth": 1}, {"key": "34026805", "model": "llama", "target_model": "human", "recognition_score": 0.9556514223920709, "ground_truth": 0}, {"key": "34026805", "model": "llama", "target_model": "claude", "recognition_score": 0.9032942110302827, "ground_truth": 0}, {"key": "34026805", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9458012713000383, "ground_truth": 0}, {"key": "34026805", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9118099542592938, "ground_truth": 0}, {"key": "36713809", "model": "llama", "target_model": "llama", "recognition_score": 0.9309620739756915, "ground_truth": 1}, {"key": "36713809", "model": "llama", "target_model": "human", "recognition_score": 0.9556514203830472, "ground_truth": 0}, {"key": "36713809", "model": "llama", "target_model": "claude", "recognition_score": 0.9178933760610398, "ground_truth": 0}, {"key": "36713809", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8596637553049464, "ground_truth": 0}, {"key": "36713809", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9661559634163512, "ground_truth": 0}, {"key": "39726411", "model": "llama", "target_model": "llama", "recognition_score": 0.4551986039872955, "ground_truth": 1}, {"key": "39726411", "model": "llama", "target_model": "human", "recognition_score": 0.5195213407993059, "ground_truth": 0}, {"key": "39726411", "model": "llama", "target_model": "claude", "recognition_score": 0.732591819544931, "ground_truth": 0}, {"key": "39726411", "model": "llama", "target_model": "gpt4", "recognition_score": 0.54286328407208, "ground_truth": 0}, {"key": "39726411", "model": "llama", "target_model": "gpt35", "recognition_score": 0.37387582095508826, "ground_truth": 0}, {"key": "37069841", "model": "llama", "target_model": "llama", "recognition_score": 0.8947894680209503, "ground_truth": 1}, {"key": "37069841", "model": "llama", "target_model": "human", "recognition_score": 0.8895288454155937, "ground_truth": 0}, {"key": "37069841", "model": "llama", "target_model": "claude", "recognition_score": 0.8056321980960612, "ground_truth": 0}, {"key": "37069841", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8278281509527697, "ground_truth": 0}, {"key": "37069841", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9399133529167788, "ground_truth": 0}, {"key": "38894693", "model": "llama", "target_model": "llama", "recognition_score": 0.8749346354178801, "ground_truth": 1}, {"key": "38894693", "model": "llama", "target_model": "human", "recognition_score": 0.8278281604295418, "ground_truth": 0}, {"key": "38894693", "model": "llama", "target_model": "claude", "recognition_score": 0.7969253668192107, "ground_truth": 0}, {"key": "38894693", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8031738213507456, "ground_truth": 0}, {"key": "38894693", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8661325236736758, "ground_truth": 0}, {"key": "33946032", "model": "llama", "target_model": "llama", "recognition_score": 0.9881308778388207, "ground_truth": 1}, {"key": "33946032", "model": "llama", "target_model": "human", "recognition_score": 0.9884026379599486, "ground_truth": 0}, {"key": "33946032", "model": "llama", "target_model": "claude", "recognition_score": 0.9848109492718002, "ground_truth": 0}, {"key": "33946032", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9515039931096956, "ground_truth": 0}, {"key": "33946032", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9623913647408302, "ground_truth": 0}, {"key": "39035311", "model": "llama", "target_model": "llama", "recognition_score": 0.8116760149387032, "ground_truth": 1}, {"key": "39035311", "model": "llama", "target_model": "human", "recognition_score": 0.7732163722931863, "ground_truth": 0}, {"key": "39035311", "model": "llama", "target_model": "claude", "recognition_score": 0.809275978307401, "ground_truth": 0}, {"key": "39035311", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8624675327955549, "ground_truth": 0}, {"key": "39035311", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6825737298782663, "ground_truth": 0}, {"key": "27680038", "model": "llama", "target_model": "llama", "recognition_score": 0.5253688268711219, "ground_truth": 1}, {"key": "27680038", "model": "llama", "target_model": "human", "recognition_score": 0.42823340105200836, "ground_truth": 0}, {"key": "27680038", "model": "llama", "target_model": "claude", "recognition_score": 0.5136684769104314, "ground_truth": 0}, {"key": "27680038", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4902356319078096, "ground_truth": 0}, {"key": "27680038", "model": "llama", "target_model": "gpt35", "recognition_score": 0.22135067650079915, "ground_truth": 0}, {"key": "36901907", "model": "llama", "target_model": "llama", "recognition_score": 0.7356416310094132, "ground_truth": 1}, {"key": "36901907", "model": "llama", "target_model": "human", "recognition_score": 0.8289388096439191, "ground_truth": 0}, {"key": "36901907", "model": "llama", "target_model": "claude", "recognition_score": 0.8998277748548189, "ground_truth": 0}, {"key": "36901907", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8198933342189892, "ground_truth": 0}, {"key": "36901907", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7233094713081678, "ground_truth": 0}, {"key": "21530542", "model": "llama", "target_model": "llama", "recognition_score": 0.6723317334878423, "ground_truth": 1}, {"key": "21530542", "model": "llama", "target_model": "human", "recognition_score": 0.7386690596875138, "ground_truth": 0}, {"key": "21530542", "model": "llama", "target_model": "claude", "recognition_score": 0.6671476574940038, "ground_truth": 0}, {"key": "21530542", "model": "llama", "target_model": "gpt4", "recognition_score": 0.860603623898419, "ground_truth": 0}, {"key": "21530542", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8449215283762653, "ground_truth": 0}, {"key": "38192532", "model": "llama", "target_model": "llama", "recognition_score": 0.8397339656696627, "ground_truth": 1}, {"key": "38192532", "model": "llama", "target_model": "human", "recognition_score": 0.8714748684143141, "ground_truth": 0}, {"key": "38192532", "model": "llama", "target_model": "claude", "recognition_score": 0.9403530553821641, "ground_truth": 0}, {"key": "38192532", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8918110433544507, "ground_truth": 0}, {"key": "38192532", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8984105487387161, "ground_truth": 0}, {"key": "34102400", "model": "llama", "target_model": "llama", "recognition_score": 0.2814056256665921, "ground_truth": 1}, {"key": "34102400", "model": "llama", "target_model": "human", "recognition_score": 0.16132023842439114, "ground_truth": 0}, {"key": "34102400", "model": "llama", "target_model": "claude", "recognition_score": 0.3611646920907494, "ground_truth": 0}, {"key": "34102400", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4130035620756553, "ground_truth": 0}, {"key": "34102400", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3702254110647167, "ground_truth": 0}, {"key": "36133399", "model": "llama", "target_model": "llama", "recognition_score": 0.6039318354866957, "ground_truth": 1}, {"key": "36133399", "model": "llama", "target_model": "human", "recognition_score": 0.8509647076986607, "ground_truth": 0}, {"key": "36133399", "model": "llama", "target_model": "claude", "recognition_score": 0.9142907235117818, "ground_truth": 0}, {"key": "36133399", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8365545488633689, "ground_truth": 0}, {"key": "36133399", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8587185673469967, "ground_truth": 0}, {"key": "34314544", "model": "llama", "target_model": "llama", "recognition_score": 0.8449215221123213, "ground_truth": 1}, {"key": "34314544", "model": "llama", "target_model": "human", "recognition_score": 0.8116760148977658, "ground_truth": 0}, {"key": "34314544", "model": "llama", "target_model": "claude", "recognition_score": 0.8606036256176045, "ground_truth": 0}, {"key": "34314544", "model": "llama", "target_model": "gpt4", "recognition_score": 0.858718583621239, "ground_truth": 0}, {"key": "34314544", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8278281510271469, "ground_truth": 0}, {"key": "33460074", "model": "llama", "target_model": "llama", "recognition_score": 0.8529354838457238, "ground_truth": 1}, {"key": "33460074", "model": "llama", "target_model": "human", "recognition_score": 0.8643104450304335, "ground_truth": 0}, {"key": "33460074", "model": "llama", "target_model": "claude", "recognition_score": 0.8469578418226332, "ground_truth": 0}, {"key": "33460074", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7662936335756307, "ground_truth": 0}, {"key": "33460074", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8529354768215132, "ground_truth": 0}, {"key": "36191495", "model": "llama", "target_model": "llama", "recognition_score": 0.6757645963009229, "ground_truth": 1}, {"key": "36191495", "model": "llama", "target_model": "human", "recognition_score": 0.7918210684360173, "ground_truth": 0}, {"key": "36191495", "model": "llama", "target_model": "claude", "recognition_score": 0.7201714960395533, "ground_truth": 0}, {"key": "36191495", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6601723855087761, "ground_truth": 0}, {"key": "36191495", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7279754536082499, "ground_truth": 0}, {"key": "39532668", "model": "llama", "target_model": "llama", "recognition_score": 0.9441768585917637, "ground_truth": 1}, {"key": "39532668", "model": "llama", "target_model": "human", "recognition_score": 0.9597620603974222, "ground_truth": 0}, {"key": "39532668", "model": "llama", "target_model": "claude", "recognition_score": 0.8624675302034484, "ground_truth": 0}, {"key": "39532668", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9032942102672807, "ground_truth": 0}, {"key": "39532668", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8244619444744906, "ground_truth": 0}, {"key": "20328247", "model": "llama", "target_model": "llama", "recognition_score": 0.6242935463862196, "ground_truth": 1}, {"key": "20328247", "model": "llama", "target_model": "human", "recognition_score": 0.41300355604144945, "ground_truth": 0}, {"key": "20328247", "model": "llama", "target_model": "claude", "recognition_score": 0.4649015778643319, "ground_truth": 0}, {"key": "20328247", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5583270081631497, "ground_truth": 0}, {"key": "20328247", "model": "llama", "target_model": "gpt35", "recognition_score": 0.550607340150374, "ground_truth": 0}, {"key": "39112675", "model": "llama", "target_model": "llama", "recognition_score": 0.7386690943093184, "ground_truth": 1}, {"key": "39112675", "model": "llama", "target_model": "human", "recognition_score": 0.5058590978913096, "ground_truth": 0}, {"key": "39112675", "model": "llama", "target_model": "claude", "recognition_score": 0.680878600898707, "ground_truth": 0}, {"key": "39112675", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7853085975360681, "ground_truth": 0}, {"key": "39112675", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8749346224716595, "ground_truth": 0}, {"key": "31620300", "model": "llama", "target_model": "llama", "recognition_score": 0.7718435198904002, "ground_truth": 1}, {"key": "31620300", "model": "llama", "target_model": "human", "recognition_score": 0.7634837562555856, "ground_truth": 0}, {"key": "31620300", "model": "llama", "target_model": "claude", "recognition_score": 0.8643104368950152, "ground_truth": 0}, {"key": "31620300", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6740504751744477, "ground_truth": 0}, {"key": "31620300", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7918210854287212, "ground_truth": 0}, {"key": "37518509", "model": "llama", "target_model": "llama", "recognition_score": 0.6442250982886568, "ground_truth": 1}, {"key": "37518509", "model": "llama", "target_model": "human", "recognition_score": 0.44360042551695444, "ground_truth": 0}, {"key": "37518509", "model": "llama", "target_model": "claude", "recognition_score": 0.6566582761712441, "ground_truth": 0}, {"key": "37518509", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6859494369564895, "ground_truth": 0}, {"key": "37518509", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7264256047216745, "ground_truth": 0}, {"key": "35454095", "model": "llama", "target_model": "llama", "recognition_score": 0.8407825838951397, "ground_truth": 1}, {"key": "35454095", "model": "llama", "target_model": "human", "recognition_score": 0.9155072520784112, "ground_truth": 0}, {"key": "35454095", "model": "llama", "target_model": "claude", "recognition_score": 0.9252299641384645, "ground_truth": 0}, {"key": "35454095", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8354835428182378, "ground_truth": 0}, {"key": "35454095", "model": "llama", "target_model": "gpt35", "recognition_score": 0.874077238035572, "ground_truth": 0}, {"key": "38542788", "model": "llama", "target_model": "llama", "recognition_score": 0.9390248160899513, "ground_truth": 1}, {"key": "38542788", "model": "llama", "target_model": "human", "recognition_score": 0.9539660969210054, "ground_truth": 0}, {"key": "38542788", "model": "llama", "target_model": "claude", "recognition_score": 0.9719924841107888, "ground_truth": 0}, {"key": "38542788", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9775429497404973, "ground_truth": 0}, {"key": "38542788", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9559813519103592, "ground_truth": 0}, {"key": "23944937", "model": "llama", "target_model": "llama", "recognition_score": 0.8558511287625509, "ground_truth": 1}, {"key": "23944937", "model": "llama", "target_model": "human", "recognition_score": 0.7759445619353366, "ground_truth": 0}, {"key": "23944937", "model": "llama", "target_model": "claude", "recognition_score": 0.8428631414462466, "ground_truth": 0}, {"key": "23944937", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8428631578132345, "ground_truth": 0}, {"key": "23944937", "model": "llama", "target_model": "gpt35", "recognition_score": 0.723309483510313, "ground_truth": 0}, {"key": "31753944", "model": "llama", "target_model": "llama", "recognition_score": 0.5409238284126399, "ground_truth": 1}, {"key": "31753944", "model": "llama", "target_model": "human", "recognition_score": 0.6442251080132179, "ground_truth": 0}, {"key": "31753944", "model": "llama", "target_model": "claude", "recognition_score": 0.6495786081054893, "ground_truth": 0}, {"key": "31753944", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7185943809279863, "ground_truth": 0}, {"key": "31753944", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5660185341257984, "ground_truth": 0}, {"key": "35527214", "model": "llama", "target_model": "llama", "recognition_score": 0.8428631655767543, "ground_truth": 1}, {"key": "35527214", "model": "llama", "target_model": "human", "recognition_score": 0.8152324933305714, "ground_truth": 0}, {"key": "35527214", "model": "llama", "target_model": "claude", "recognition_score": 0.7676898672072306, "ground_truth": 0}, {"key": "35527214", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8856314685250136, "ground_truth": 0}, {"key": "35527214", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7356416434733635, "ground_truth": 0}, {"key": "40400404", "model": "llama", "target_model": "llama", "recognition_score": 0.971563969420194, "ground_truth": 1}, {"key": "40400404", "model": "llama", "target_model": "human", "recognition_score": 0.9791955093264401, "ground_truth": 0}, {"key": "40400404", "model": "llama", "target_model": "claude", "recognition_score": 0.9834704447334126, "ground_truth": 0}, {"key": "40400404", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9465966710507673, "ground_truth": 0}, {"key": "40400404", "model": "llama", "target_model": "gpt35", "recognition_score": 0.957277804861231, "ground_truth": 0}, {"key": "21713119", "model": "llama", "target_model": "llama", "recognition_score": 0.525368826309648, "ground_truth": 1}, {"key": "21713119", "model": "llama", "target_model": "human", "recognition_score": 0.35042139190279603, "ground_truth": 0}, {"key": "21713119", "model": "llama", "target_model": "claude", "recognition_score": 0.46684559338143905, "ground_truth": 0}, {"key": "21713119", "model": "llama", "target_model": "gpt4", "recognition_score": 0.49414090543360584, "ground_truth": 0}, {"key": "21713119", "model": "llama", "target_model": "gpt35", "recognition_score": 0.33111974330699084, "ground_truth": 0}, {"key": "28730678", "model": "llama", "target_model": "llama", "recognition_score": 0.9066531264543636, "ground_truth": 1}, {"key": "28730678", "model": "llama", "target_model": "human", "recognition_score": 0.8670357622151825, "ground_truth": 0}, {"key": "28730678", "model": "llama", "target_model": "claude", "recognition_score": 0.9066531223608864, "ground_truth": 0}, {"key": "28730678", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9420819088664958, "ground_truth": 0}, {"key": "28730678", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9124361581840963, "ground_truth": 0}, {"key": "36823733", "model": "llama", "target_model": "llama", "recognition_score": 0.8705972687714708, "ground_truth": 1}, {"key": "36823733", "model": "llama", "target_model": "human", "recognition_score": 0.8300437656301991, "ground_truth": 0}, {"key": "36823733", "model": "llama", "target_model": "claude", "recognition_score": 0.8509647073838098, "ground_truth": 0}, {"key": "36823733", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7813306246834273, "ground_truth": 0}, {"key": "36823733", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7446563445403304, "ground_truth": 0}, {"key": "35988862", "model": "llama", "target_model": "llama", "recognition_score": 0.33458943445496175, "ground_truth": 1}, {"key": "35988862", "model": "llama", "target_model": "human", "recognition_score": 0.43782351195927, "ground_truth": 0}, {"key": "35988862", "model": "llama", "target_model": "claude", "recognition_score": 0.5389832161512667, "ground_truth": 0}, {"key": "35988862", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6020615858427956, "ground_truth": 0}, {"key": "35988862", "model": "llama", "target_model": "gpt35", "recognition_score": 0.38861799661343216, "ground_truth": 0}, {"key": "40499665", "model": "llama", "target_model": "llama", "recognition_score": 0.971347329540424, "ground_truth": 1}, {"key": "40499665", "model": "llama", "target_model": "human", "recognition_score": 0.9403530486960736, "ground_truth": 0}, {"key": "40499665", "model": "llama", "target_model": "claude", "recognition_score": 0.905322303685009, "ground_truth": 0}, {"key": "40499665", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9768465903753071, "ground_truth": 0}, {"key": "40499665", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9525741241247467, "ground_truth": 0}, {"key": "32829820", "model": "llama", "target_model": "llama", "recognition_score": 0.8519528125439078, "ground_truth": 1}, {"key": "32829820", "model": "llama", "target_model": "human", "recognition_score": 0.7745833858146488, "ground_truth": 0}, {"key": "32829820", "model": "llama", "target_model": "claude", "recognition_score": 0.8376199716689775, "ground_truth": 0}, {"key": "32829820", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8244619228759507, "ground_truth": 0}, {"key": "32829820", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7446563505230448, "ground_truth": 0}, {"key": "20583553", "model": "llama", "target_model": "llama", "recognition_score": 0.19806416859708498, "ground_truth": 1}, {"key": "20583553", "model": "llama", "target_model": "human", "recognition_score": 0.1732882104844916, "ground_truth": 0}, {"key": "20583553", "model": "llama", "target_model": "claude", "recognition_score": 0.19930799095406837, "ground_truth": 0}, {"key": "20583553", "model": "llama", "target_model": "gpt4", "recognition_score": 0.24653332210962992, "ground_truth": 0}, {"key": "20583553", "model": "llama", "target_model": "gpt35", "recognition_score": 0.18126320783176914, "ground_truth": 0}, {"key": "30501550", "model": "llama", "target_model": "llama", "recognition_score": 0.9343951583137458, "ground_truth": 1}, {"key": "30501550", "model": "llama", "target_model": "human", "recognition_score": 0.952925821811463, "ground_truth": 0}, {"key": "30501550", "model": "llama", "target_model": "claude", "recognition_score": 0.954984469525001, "ground_truth": 0}, {"key": "30501550", "model": "llama", "target_model": "gpt4", "recognition_score": 0.93902481766908, "ground_truth": 0}, {"key": "30501550", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8397339701459352, "ground_truth": 0}, {"key": "38755897", "model": "llama", "target_model": "llama", "recognition_score": 0.6113819489426012, "ground_truth": 1}, {"key": "38755897", "model": "llama", "target_model": "human", "recognition_score": 0.6370308071038949, "ground_truth": 0}, {"key": "38755897", "model": "llama", "target_model": "claude", "recognition_score": 0.8006920186708645, "ground_truth": 0}, {"key": "38755897", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7170118793919844, "ground_truth": 0}, {"key": "38755897", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8509647210392361, "ground_truth": 0}, {"key": "35507201", "model": "llama", "target_model": "llama", "recognition_score": 0.7490871865292583, "ground_truth": 1}, {"key": "35507201", "model": "llama", "target_model": "human", "recognition_score": 0.9142907202514975, "ground_truth": 0}, {"key": "35507201", "model": "llama", "target_model": "claude", "recognition_score": 0.9178933704457043, "ground_truth": 0}, {"key": "35507201", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8092759748419606, "ground_truth": 0}, {"key": "35507201", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8080672075959213, "ground_truth": 0}, {"key": "36453511", "model": "llama", "target_model": "llama", "recognition_score": 0.9425067232656832, "ground_truth": 1}, {"key": "36453511", "model": "llama", "target_model": "human", "recognition_score": 0.9416541631763627, "ground_truth": 0}, {"key": "36453511", "model": "llama", "target_model": "claude", "recognition_score": 0.9142907230848558, "ground_truth": 0}, {"key": "36453511", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9492946358678142, "ground_truth": 0}, {"key": "36453511", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9532750435870885, "ground_truth": 0}, {"key": "38066835", "model": "llama", "target_model": "llama", "recognition_score": 0.9079671321189139, "ground_truth": 1}, {"key": "38066835", "model": "llama", "target_model": "human", "recognition_score": 0.8244619345749002, "ground_truth": 0}, {"key": "38066835", "model": "llama", "target_model": "claude", "recognition_score": 0.851952791394042, "ground_truth": 0}, {"key": "38066835", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8661325214224704, "ground_truth": 0}, {"key": "38066835", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8933093970962188, "ground_truth": 0}, {"key": "39697181", "model": "llama", "target_model": "llama", "recognition_score": 0.6424324918390982, "ground_truth": 1}, {"key": "39697181", "model": "llama", "target_model": "human", "recognition_score": 0.5907792355817075, "ground_truth": 0}, {"key": "39697181", "model": "llama", "target_model": "claude", "recognition_score": 0.7310585788675408, "ground_truth": 0}, {"key": "39697181", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8469578459778053, "ground_truth": 0}, {"key": "39697181", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6352224117911232, "ground_truth": 0}, {"key": "21820893", "model": "llama", "target_model": "llama", "recognition_score": 0.8300437544613519, "ground_truth": 1}, {"key": "21820893", "model": "llama", "target_model": "human", "recognition_score": 0.8824278662298702, "ground_truth": 0}, {"key": "21820893", "model": "llama", "target_model": "claude", "recognition_score": 0.7745833705201168, "ground_truth": 0}, {"key": "21820893", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7201714893026835, "ground_truth": 0}, {"key": "21820893", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8652240802507232, "ground_truth": 0}, {"key": "40519933", "model": "llama", "target_model": "llama", "recognition_score": 0.8679338434532645, "ground_truth": 1}, {"key": "40519933", "model": "llama", "target_model": "human", "recognition_score": 0.7648916104280238, "ground_truth": 0}, {"key": "40519933", "model": "llama", "target_model": "claude", "recognition_score": 0.7745833799776467, "ground_truth": 0}, {"key": "40519933", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7606506654169013, "ground_truth": 0}, {"key": "40519933", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8774767834606535, "ground_truth": 0}, {"key": "30446033", "model": "llama", "target_model": "llama", "recognition_score": 0.907967138428212, "ground_truth": 1}, {"key": "30446033", "model": "llama", "target_model": "human", "recognition_score": 0.9358173553394618, "ground_truth": 0}, {"key": "30446033", "model": "llama", "target_model": "claude", "recognition_score": 0.8807970789746986, "ground_truth": 0}, {"key": "30446033", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9039745116577632, "ground_truth": 0}, {"key": "30446033", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9005297853088134, "ground_truth": 0}, {"key": "40216291", "model": "llama", "target_model": "llama", "recognition_score": 0.8255897233857824, "ground_truth": 1}, {"key": "40216291", "model": "llama", "target_model": "human", "recognition_score": 0.9190633011372958, "ground_truth": 0}, {"key": "40216291", "model": "llama", "target_model": "claude", "recognition_score": 0.9532750413094306, "ground_truth": 0}, {"key": "40216291", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9429286007275969, "ground_truth": 0}, {"key": "40216291", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9105453933175355, "ground_truth": 0}, {"key": "33479118", "model": "llama", "target_model": "llama", "recognition_score": 0.48438009999102233, "ground_truth": 1}, {"key": "33479118", "model": "llama", "target_model": "human", "recognition_score": 0.42632156078882877, "ground_truth": 0}, {"key": "33479118", "model": "llama", "target_model": "claude", "recognition_score": 0.702530038926587, "ground_truth": 0}, {"key": "33479118", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7248702683792395, "ground_truth": 0}, {"key": "33479118", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5640984984048903, "ground_truth": 0}, {"key": "22297373", "model": "llama", "target_model": "llama", "recognition_score": 0.20434189485319676, "ground_truth": 1}, {"key": "22297373", "model": "llama", "target_model": "human", "recognition_score": 0.23792987925161133, "ground_truth": 0}, {"key": "22297373", "model": "llama", "target_model": "claude", "recognition_score": 0.25683197452430423, "ground_truth": 0}, {"key": "22297373", "model": "llama", "target_model": "gpt4", "recognition_score": 0.36477756382023585, "ground_truth": 0}, {"key": "22297373", "model": "llama", "target_model": "gpt35", "recognition_score": 0.27825678809263155, "ground_truth": 0}, {"key": "36463668", "model": "llama", "target_model": "llama", "recognition_score": 0.24944722346126263, "ground_truth": 1}, {"key": "36463668", "model": "llama", "target_model": "human", "recognition_score": 0.27357438027349934, "ground_truth": 0}, {"key": "36463668", "model": "llama", "target_model": "claude", "recognition_score": 0.307358009364421, "ground_truth": 0}, {"key": "36463668", "model": "llama", "target_model": "gpt4", "recognition_score": 0.38676342410045117, "ground_truth": 0}, {"key": "36463668", "model": "llama", "target_model": "gpt35", "recognition_score": 0.21469141604167297, "ground_truth": 0}, {"key": "35264615", "model": "llama", "target_model": "llama", "recognition_score": 0.7310586037701731, "ground_truth": 1}, {"key": "35264615", "model": "llama", "target_model": "human", "recognition_score": 0.8469578341882639, "ground_truth": 0}, {"key": "35264615", "model": "llama", "target_model": "claude", "recognition_score": 0.5214711378498866, "ground_truth": 0}, {"key": "35264615", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7704647746995572, "ground_truth": 0}, {"key": "35264615", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6388352835199086, "ground_truth": 0}, {"key": "39898482", "model": "llama", "target_model": "llama", "recognition_score": 0.9635062281521131, "ground_truth": 1}, {"key": "39898482", "model": "llama", "target_model": "human", "recognition_score": 0.9704646581710618, "ground_truth": 0}, {"key": "39898482", "model": "llama", "target_model": "claude", "recognition_score": 0.9651191146500173, "ground_truth": 0}, {"key": "39898482", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9750122027265375, "ground_truth": 0}, {"key": "39898482", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9787126500726507, "ground_truth": 0}, {"key": "37228721", "model": "llama", "target_model": "llama", "recognition_score": 0.8679338363005606, "ground_truth": 1}, {"key": "37228721", "model": "llama", "target_model": "human", "recognition_score": 0.8732148318571389, "ground_truth": 0}, {"key": "37228721", "model": "llama", "target_model": "claude", "recognition_score": 0.858718572121392, "ground_truth": 0}, {"key": "37228721", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8969755684836841, "ground_truth": 0}, {"key": "37228721", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8955226828229683, "ground_truth": 0}, {"key": "24535799", "model": "llama", "target_model": "llama", "recognition_score": 0.9465966646827925, "ground_truth": 1}, {"key": "24535799", "model": "llama", "target_model": "human", "recognition_score": 0.9324533098224167, "ground_truth": 0}, {"key": "24535799", "model": "llama", "target_model": "claude", "recognition_score": 0.7295197817327274, "ground_truth": 0}, {"key": "24535799", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7446563490233746, "ground_truth": 0}, {"key": "24535799", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8289388073324802, "ground_truth": 0}, {"key": "35177759", "model": "llama", "target_model": "llama", "recognition_score": 0.8925625218870502, "ground_truth": 1}, {"key": "35177759", "model": "llama", "target_model": "human", "recognition_score": 0.9005297843197705, "ground_truth": 0}, {"key": "35177759", "model": "llama", "target_model": "claude", "recognition_score": 0.8962513680665178, "ground_truth": 0}, {"key": "35177759", "model": "llama", "target_model": "gpt4", "recognition_score": 0.91906329209203, "ground_truth": 0}, {"key": "35177759", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9130583524530032, "ground_truth": 0}, {"key": "34364829", "model": "llama", "target_model": "llama", "recognition_score": 0.638835287448363, "ground_truth": 1}, {"key": "34364829", "model": "llama", "target_model": "human", "recognition_score": 0.8577681030324084, "ground_truth": 0}, {"key": "34364829", "model": "llama", "target_model": "claude", "recognition_score": 0.6876299890220469, "ground_truth": 0}, {"key": "34364829", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7416740058480816, "ground_truth": 0}, {"key": "34364829", "model": "llama", "target_model": "gpt35", "recognition_score": 0.654894728433333, "ground_truth": 0}, {"key": "38090732", "model": "llama", "target_model": "llama", "recognition_score": 0.940789751729514, "ground_truth": 1}, {"key": "38090732", "model": "llama", "target_model": "human", "recognition_score": 0.8679338319468775, "ground_truth": 0}, {"key": "38090732", "model": "llama", "target_model": "claude", "recognition_score": 0.818736792560462, "ground_truth": 0}, {"key": "38090732", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9019206825219511, "ground_truth": 0}, {"key": "38090732", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9086178984968226, "ground_truth": 0}, {"key": "30651479", "model": "llama", "target_model": "llama", "recognition_score": 0.8164063755190688, "ground_truth": 1}, {"key": "30651479", "model": "llama", "target_model": "human", "recognition_score": 0.9319595858282973, "ground_truth": 0}, {"key": "30651479", "model": "llama", "target_model": "claude", "recognition_score": 0.7732163674431863, "ground_truth": 0}, {"key": "30651479", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8596637540409475, "ground_truth": 0}, {"key": "30651479", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9086178956124926, "ground_truth": 0}, {"key": "39380921", "model": "llama", "target_model": "llama", "recognition_score": 0.5428632759132663, "ground_truth": 1}, {"key": "39380921", "model": "llama", "target_model": "human", "recognition_score": 0.646013721135254, "ground_truth": 0}, {"key": "39380921", "model": "llama", "target_model": "claude", "recognition_score": 0.4225046342106195, "ground_truth": 0}, {"key": "39380921", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8044059124570674, "ground_truth": 0}, {"key": "39380921", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3647775589350975, "ground_truth": 0}, {"key": "39037490", "model": "llama", "target_model": "llama", "recognition_score": 0.2909808721933382, "ground_truth": 1}, {"key": "39037490", "model": "llama", "target_model": "human", "recognition_score": 0.23231016215158592, "ground_truth": 0}, {"key": "39037490", "model": "llama", "target_model": "claude", "recognition_score": 0.44360041416953644, "ground_truth": 0}, {"key": "39037490", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5774953503824231, "ground_truth": 0}, {"key": "39037490", "model": "llama", "target_model": "gpt35", "recognition_score": 0.34510527577697503, "ground_truth": 0}, {"key": "35917499", "model": "llama", "target_model": "llama", "recognition_score": 0.9046505259835806, "ground_truth": 1}, {"key": "35917499", "model": "llama", "target_model": "human", "recognition_score": 0.9263037276854967, "ground_truth": 0}, {"key": "35917499", "model": "llama", "target_model": "claude", "recognition_score": 0.9390248215173963, "ground_truth": 0}, {"key": "35917499", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8311430493198124, "ground_truth": 0}, {"key": "35917499", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9626731130231622, "ground_truth": 0}, {"key": "34908073", "model": "llama", "target_model": "llama", "recognition_score": 0.8799743725509312, "ground_truth": 1}, {"key": "34908073", "model": "llama", "target_model": "human", "recognition_score": 0.7839884673781856, "ground_truth": 0}, {"key": "34908073", "model": "llama", "target_model": "claude", "recognition_score": 0.8407825894064257, "ground_truth": 0}, {"key": "34908073", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7592254033059913, "ground_truth": 0}, {"key": "34908073", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6688802681007631, "ground_truth": 0}, {"key": "36344759", "model": "llama", "target_model": "llama", "recognition_score": 0.8774767887742242, "ground_truth": 1}, {"key": "36344759", "model": "llama", "target_model": "human", "recognition_score": 0.5253688336740168, "ground_truth": 0}, {"key": "36344759", "model": "llama", "target_model": "claude", "recognition_score": 0.8548846361145178, "ground_truth": 0}, {"key": "36344759", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8333245978727924, "ground_truth": 0}, {"key": "36344759", "model": "llama", "target_model": "gpt35", "recognition_score": 0.809275974066292, "ground_truth": 0}, {"key": "39984637", "model": "llama", "target_model": "llama", "recognition_score": 0.6113819688512594, "ground_truth": 1}, {"key": "39984637", "model": "llama", "target_model": "human", "recognition_score": 0.8615382117124337, "ground_truth": 0}, {"key": "39984637", "model": "llama", "target_model": "claude", "recognition_score": 0.6688802483412434, "ground_truth": 0}, {"key": "39984637", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6020615807345213, "ground_truth": 0}, {"key": "39984637", "model": "llama", "target_model": "gpt35", "recognition_score": 0.590779196743387, "ground_truth": 0}, {"key": "17917326", "model": "llama", "target_model": "llama", "recognition_score": 0.554470453700824, "ground_truth": 1}, {"key": "17917326", "model": "llama", "target_model": "human", "recognition_score": 0.49609384988564564, "ground_truth": 0}, {"key": "17917326", "model": "llama", "target_model": "claude", "recognition_score": 0.7248702643321484, "ground_truth": 0}, {"key": "17917326", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7138307611228227, "ground_truth": 0}, {"key": "17917326", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4148988430638386, "ground_truth": 0}, {"key": "32193638", "model": "llama", "target_model": "llama", "recognition_score": 0.7648916190341448, "ground_truth": 1}, {"key": "32193638", "model": "llama", "target_model": "human", "recognition_score": 0.8697145817516589, "ground_truth": 0}, {"key": "32193638", "model": "llama", "target_model": "claude", "recognition_score": 0.8255897214561342, "ground_truth": 0}, {"key": "32193638", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8175744829303553, "ground_truth": 0}, {"key": "32193638", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8044059237849445, "ground_truth": 0}, {"key": "34564692", "model": "llama", "target_model": "llama", "recognition_score": 0.87234737269238, "ground_truth": 1}, {"key": "34564692", "model": "llama", "target_model": "human", "recognition_score": 0.8783142438701104, "ground_truth": 0}, {"key": "34564692", "model": "llama", "target_model": "claude", "recognition_score": 0.8984105504910964, "ground_truth": 0}, {"key": "34564692", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9124361535023939, "ground_truth": 0}, {"key": "34564692", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8152324814598894, "ground_truth": 0}, {"key": "39329284", "model": "llama", "target_model": "llama", "recognition_score": 0.9873750514658666, "ground_truth": 1}, {"key": "39329284", "model": "llama", "target_model": "human", "recognition_score": 0.8910549528710436, "ground_truth": 0}, {"key": "39329284", "model": "llama", "target_model": "claude", "recognition_score": 0.976669232080423, "ground_truth": 0}, {"key": "39329284", "model": "llama", "target_model": "gpt4", "recognition_score": 0.983596968453192, "ground_truth": 0}, {"key": "39329284", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9874720654844296, "ground_truth": 0}, {"key": "37438541", "model": "llama", "target_model": "llama", "recognition_score": 0.7090191290409092, "ground_truth": 1}, {"key": "37438541", "model": "llama", "target_model": "human", "recognition_score": 0.8587185796764831, "ground_truth": 0}, {"key": "37438541", "model": "llama", "target_model": "claude", "recognition_score": 0.5869964165618559, "ground_truth": 0}, {"key": "37438541", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7248702744180568, "ground_truth": 0}, {"key": "37438541", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5370413915689451, "ground_truth": 0}, {"key": "34652757", "model": "llama", "target_model": "llama", "recognition_score": 0.917302662258505, "ground_truth": 1}, {"key": "34652757", "model": "llama", "target_model": "human", "recognition_score": 0.9299510448423459, "ground_truth": 0}, {"key": "34652757", "model": "llama", "target_model": "claude", "recognition_score": 0.9059898218747062, "ground_truth": 0}, {"key": "34652757", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9184802485358416, "ground_truth": 0}, {"key": "34652757", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9079671401284617, "ground_truth": 0}, {"key": "31361004", "model": "llama", "target_model": "llama", "recognition_score": 0.7577943741824503, "ground_truth": 1}, {"key": "31361004", "model": "llama", "target_model": "human", "recognition_score": 0.7620701207586796, "ground_truth": 0}, {"key": "31361004", "model": "llama", "target_model": "claude", "recognition_score": 0.9477691466691156, "ground_truth": 0}, {"key": "31361004", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8991213831722951, "ground_truth": 0}, {"key": "31361004", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9485372337762921, "ground_truth": 0}, {"key": "26150727", "model": "llama", "target_model": "llama", "recognition_score": 0.5409238848120812, "ground_truth": 1}, {"key": "26150727", "model": "llama", "target_model": "human", "recognition_score": 0.6531269292783671, "ground_truth": 0}, {"key": "26150727", "model": "llama", "target_model": "claude", "recognition_score": 0.5506073539536787, "ground_truth": 0}, {"key": "26150727", "model": "llama", "target_model": "gpt4", "recognition_score": 0.59643313015334, "ground_truth": 0}, {"key": "26150727", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5774953828468515, "ground_truth": 0}, {"key": "36997402", "model": "llama", "target_model": "llama", "recognition_score": 0.8519527954199478, "ground_truth": 1}, {"key": "36997402", "model": "llama", "target_model": "human", "recognition_score": 0.8529354877958557, "ground_truth": 0}, {"key": "36997402", "model": "llama", "target_model": "claude", "recognition_score": 0.8152324882096342, "ground_truth": 0}, {"key": "36997402", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8152324701012303, "ground_truth": 0}, {"key": "36997402", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8969755735051327, "ground_truth": 0}, {"key": "37430643", "model": "llama", "target_model": "llama", "recognition_score": 0.6893056248111964, "ground_truth": 1}, {"key": "37430643", "model": "llama", "target_model": "human", "recognition_score": 0.7956580822186946, "ground_truth": 0}, {"key": "37430643", "model": "llama", "target_model": "claude", "recognition_score": 0.7563575530541168, "ground_truth": 0}, {"key": "37430643", "model": "llama", "target_model": "gpt4", "recognition_score": 0.603931813629643, "ground_truth": 0}, {"key": "37430643", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8056321795530382, "ground_truth": 0}, {"key": "36964631", "model": "llama", "target_model": "llama", "recognition_score": 0.712232197064976, "ground_truth": 1}, {"key": "36964631", "model": "llama", "target_model": "human", "recognition_score": 0.8221891269932207, "ground_truth": 0}, {"key": "36964631", "model": "llama", "target_model": "claude", "recognition_score": 0.7931059507413566, "ground_truth": 0}, {"key": "36964631", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8933094017901767, "ground_truth": 0}, {"key": "36964631", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8529354751552713, "ground_truth": 0}, {"key": "35502013", "model": "llama", "target_model": "llama", "recognition_score": 0.8322366560411627, "ground_truth": 1}, {"key": "35502013", "model": "llama", "target_model": "human", "recognition_score": 0.8548846384650785, "ground_truth": 0}, {"key": "35502013", "model": "llama", "target_model": "claude", "recognition_score": 0.8376199713649025, "ground_truth": 0}, {"key": "35502013", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8428631312427498, "ground_truth": 0}, {"key": "35502013", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8322366445784464, "ground_truth": 0}, {"key": "33987664", "model": "llama", "target_model": "llama", "recognition_score": 0.9202179835455123, "ground_truth": 1}, {"key": "33987664", "model": "llama", "target_model": "human", "recognition_score": 0.9304582533959996, "ground_truth": 0}, {"key": "33987664", "model": "llama", "target_model": "claude", "recognition_score": 0.9196425330335444, "ground_truth": 0}, {"key": "33987664", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9118099547534247, "ground_truth": 0}, {"key": "33987664", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8940517050189011, "ground_truth": 0}, {"key": "35203721", "model": "llama", "target_model": "llama", "recognition_score": 0.7371581733571834, "ground_truth": 1}, {"key": "35203721", "model": "llama", "target_model": "human", "recognition_score": 0.5370413858195386, "ground_truth": 0}, {"key": "35203721", "model": "llama", "target_model": "claude", "recognition_score": 0.6688802606619737, "ground_truth": 0}, {"key": "35203721", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6876299993840547, "ground_truth": 0}, {"key": "35203721", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6671477034027626, "ground_truth": 0}, {"key": "39028348", "model": "llama", "target_model": "llama", "recognition_score": 0.8856314734275669, "ground_truth": 1}, {"key": "39028348", "model": "llama", "target_model": "human", "recognition_score": 0.7786493211585557, "ground_truth": 0}, {"key": "39028348", "model": "llama", "target_model": "claude", "recognition_score": 0.9532750435071025, "ground_truth": 0}, {"key": "39028348", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9092645086619585, "ground_truth": 0}, {"key": "39028348", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8587185920550895, "ground_truth": 0}, {"key": "37459383", "model": "llama", "target_model": "llama", "recognition_score": 0.8732148255097637, "ground_truth": 1}, {"key": "37459383", "model": "llama", "target_model": "human", "recognition_score": 0.8643104605406615, "ground_truth": 0}, {"key": "37459383", "model": "llama", "target_model": "claude", "recognition_score": 0.952925821677788, "ground_truth": 0}, {"key": "37459383", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9433475725748453, "ground_truth": 0}, {"key": "37459383", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9390248194186375, "ground_truth": 0}, {"key": "34020070", "model": "llama", "target_model": "llama", "recognition_score": 0.6406358422249289, "ground_truth": 1}, {"key": "34020070", "model": "llama", "target_model": "human", "recognition_score": 0.6825737558663767, "ground_truth": 0}, {"key": "34020070", "model": "llama", "target_model": "claude", "recognition_score": 0.8198933527664064, "ground_truth": 0}, {"key": "34020070", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5851011368986463, "ground_truth": 0}, {"key": "34020070", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7341195271301012, "ground_truth": 0}, {"key": "35176615", "model": "llama", "target_model": "llama", "recognition_score": 0.8092759643949566, "ground_truth": 1}, {"key": "35176615", "model": "llama", "target_model": "human", "recognition_score": 0.6261241722114679, "ground_truth": 0}, {"key": "35176615", "model": "llama", "target_model": "claude", "recognition_score": 0.8128673155879673, "ground_truth": 0}, {"key": "35176615", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8633916055056617, "ground_truth": 0}, {"key": "35176615", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7956580902235507, "ground_truth": 0}, {"key": "33296389", "model": "llama", "target_model": "llama", "recognition_score": 0.9263037302733853, "ground_truth": 1}, {"key": "33296389", "model": "llama", "target_model": "human", "recognition_score": 0.8879840412885732, "ground_truth": 0}, {"key": "33296389", "model": "llama", "target_model": "claude", "recognition_score": 0.8910549450198031, "ground_truth": 0}, {"key": "33296389", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9314625058975554, "ground_truth": 0}, {"key": "33296389", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8991213759518842, "ground_truth": 0}, {"key": "35399504", "model": "llama", "target_model": "llama", "recognition_score": 0.976846588717862, "ground_truth": 1}, {"key": "35399504", "model": "llama", "target_model": "human", "recognition_score": 0.9804313252805678, "ground_truth": 0}, {"key": "35399504", "model": "llama", "target_model": "claude", "recognition_score": 0.9870795285424157, "ground_truth": 0}, {"key": "35399504", "model": "llama", "target_model": "gpt4", "recognition_score": 0.987472068317737, "ground_truth": 0}, {"key": "35399504", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9511422195478726, "ground_truth": 0}, {"key": "34807886", "model": "llama", "target_model": "llama", "recognition_score": 0.6113819629548657, "ground_truth": 1}, {"key": "34807886", "model": "llama", "target_model": "human", "recognition_score": 0.41869690591035585, "ground_truth": 0}, {"key": "34807886", "model": "llama", "target_model": "claude", "recognition_score": 0.46879063131634846, "ground_truth": 0}, {"key": "34807886", "model": "llama", "target_model": "gpt4", "recognition_score": 0.64601368583077, "ground_truth": 0}, {"key": "34807886", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4073334188461481, "ground_truth": 0}, {"key": "37629813", "model": "llama", "target_model": "llama", "recognition_score": 0.8740772342061798, "ground_truth": 1}, {"key": "37629813", "model": "llama", "target_model": "human", "recognition_score": 0.7386691005552868, "ground_truth": 0}, {"key": "37629813", "model": "llama", "target_model": "claude", "recognition_score": 0.8947894619241433, "ground_truth": 0}, {"key": "37629813", "model": "llama", "target_model": "gpt4", "recognition_score": 0.937668959592599, "ground_truth": 0}, {"key": "37629813", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8568122886044188, "ground_truth": 0}, {"key": "28084389", "model": "llama", "target_model": "llama", "recognition_score": 0.8864204130568174, "ground_truth": 1}, {"key": "28084389", "model": "llama", "target_model": "human", "recognition_score": 0.9092645119327271, "ground_truth": 0}, {"key": "28084389", "model": "llama", "target_model": "claude", "recognition_score": 0.7918210705084106, "ground_truth": 0}, {"key": "28084389", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9658995770359361, "ground_truth": 0}, {"key": "28084389", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9664104961547013, "ground_truth": 0}, {"key": "35391734", "model": "llama", "target_model": "llama", "recognition_score": 0.8723473621906249, "ground_truth": 1}, {"key": "35391734", "model": "llama", "target_model": "human", "recognition_score": 0.8783142593965575, "ground_truth": 0}, {"key": "35391734", "model": "llama", "target_model": "claude", "recognition_score": 0.8816149013536261, "ground_truth": 0}, {"key": "35391734", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8397339631478882, "ground_truth": 0}, {"key": "35391734", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8799743695263428, "ground_truth": 0}, {"key": "40214591", "model": "llama", "target_model": "llama", "recognition_score": 0.7106283033276765, "ground_truth": 1}, {"key": "40214591", "model": "llama", "target_model": "human", "recognition_score": 0.7732163521417331, "ground_truth": 0}, {"key": "40214591", "model": "llama", "target_model": "claude", "recognition_score": 0.7122321801271152, "ground_truth": 0}, {"key": "40214591", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7690802259561033, "ground_truth": 0}, {"key": "40214591", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7154240254670989, "ground_truth": 0}, {"key": "26283171", "model": "llama", "target_model": "llama", "recognition_score": 0.8910549633892665, "ground_truth": 1}, {"key": "26283171", "model": "llama", "target_model": "human", "recognition_score": 0.814052804292198, "ground_truth": 0}, {"key": "26283171", "model": "llama", "target_model": "claude", "recognition_score": 0.8397339612179446, "ground_truth": 0}, {"key": "26283171", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8019358323591157, "ground_truth": 0}, {"key": "26283171", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8887587914433482, "ground_truth": 0}, {"key": "37084030", "model": "llama", "target_model": "llama", "recognition_score": 0.28298813525805466, "ground_truth": 1}, {"key": "37084030", "model": "llama", "target_model": "human", "recognition_score": 0.32594950809875745, "ground_truth": 0}, {"key": "37084030", "model": "llama", "target_model": "claude", "recognition_score": 0.45132651648023936, "ground_truth": 0}, {"key": "37084030", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3738758338655676, "ground_truth": 0}, {"key": "37084030", "model": "llama", "target_model": "gpt35", "recognition_score": 0.29910517332565467, "ground_truth": 0}, {"key": "39027295", "model": "llama", "target_model": "llama", "recognition_score": 0.33807711722790124, "ground_truth": 1}, {"key": "39027295", "model": "llama", "target_model": "human", "recognition_score": 0.6315942894130792, "ground_truth": 0}, {"key": "39027295", "model": "llama", "target_model": "claude", "recognition_score": 0.7185944079556722, "ground_truth": 0}, {"key": "39027295", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6352224437241959, "ground_truth": 0}, {"key": "39027295", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6992544244944547, "ground_truth": 0}, {"key": "14018647", "model": "llama", "target_model": "llama", "recognition_score": 0.4902355991200126, "ground_truth": 1}, {"key": "14018647", "model": "llama", "target_model": "human", "recognition_score": 0.27825679542411585, "ground_truth": 0}, {"key": "14018647", "model": "llama", "target_model": "claude", "recognition_score": 0.6442251286464322, "ground_truth": 0}, {"key": "14018647", "model": "llama", "target_model": "gpt4", "recognition_score": 0.49804688832042693, "ground_truth": 0}, {"key": "14018647", "model": "llama", "target_model": "gpt35", "recognition_score": 0.40544875367939126, "ground_truth": 0}, {"key": "37424289", "model": "llama", "target_model": "llama", "recognition_score": 0.9553191286957265, "ground_truth": 1}, {"key": "37424289", "model": "llama", "target_model": "human", "recognition_score": 0.9880389008054657, "ground_truth": 0}, {"key": "37424289", "model": "llama", "target_model": "claude", "recognition_score": 0.9579122745196074, "ground_truth": 0}, {"key": "37424289", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9814534363479823, "ground_truth": 0}, {"key": "37424289", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9600626901136603, "ground_truth": 0}, {"key": "37498031", "model": "llama", "target_model": "llama", "recognition_score": 0.7676898654033535, "ground_truth": 1}, {"key": "37498031", "model": "llama", "target_model": "human", "recognition_score": 0.7943849478010883, "ground_truth": 0}, {"key": "37498031", "model": "llama", "target_model": "claude", "recognition_score": 0.7074046759024322, "ground_truth": 0}, {"key": "37498031", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8969755715927004, "ground_truth": 0}, {"key": "37498031", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8322366432829541, "ground_truth": 0}, {"key": "30104095", "model": "llama", "target_model": "llama", "recognition_score": 0.778649326804017, "ground_truth": 1}, {"key": "30104095", "model": "llama", "target_model": "human", "recognition_score": 0.8354835240125725, "ground_truth": 0}, {"key": "30104095", "model": "llama", "target_model": "claude", "recognition_score": 0.6774740292323044, "ground_truth": 0}, {"key": "30104095", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7201714933710827, "ground_truth": 0}, {"key": "30104095", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8311430516495634, "ground_truth": 0}, {"key": "37911407", "model": "llama", "target_model": "llama", "recognition_score": 0.9556514179730148, "ground_truth": 1}, {"key": "37911407", "model": "llama", "target_model": "human", "recognition_score": 0.9863631643914028, "ground_truth": 0}, {"key": "37911407", "model": "llama", "target_model": "claude", "recognition_score": 0.9518632290630593, "ground_truth": 0}, {"key": "37911407", "model": "llama", "target_model": "gpt4", "recognition_score": 0.98058065123711, "ground_truth": 0}, {"key": "37911407", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9656413068071169, "ground_truth": 0}, {"key": "39177472", "model": "llama", "target_model": "llama", "recognition_score": 0.7956580888876427, "ground_truth": 1}, {"key": "39177472", "model": "llama", "target_model": "human", "recognition_score": 0.8244619386322634, "ground_truth": 0}, {"key": "39177472", "model": "llama", "target_model": "claude", "recognition_score": 0.9155072417022587, "ground_truth": 0}, {"key": "39177472", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8479677655163176, "ground_truth": 0}, {"key": "39177472", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8824278714470548, "ground_truth": 0}, {"key": "32325454", "model": "llama", "target_model": "llama", "recognition_score": 0.9591542869087233, "ground_truth": 1}, {"key": "32325454", "model": "llama", "target_model": "human", "recognition_score": 0.9066531234852183, "ground_truth": 0}, {"key": "32325454", "model": "llama", "target_model": "claude", "recognition_score": 0.932453308245608, "ground_truth": 0}, {"key": "32325454", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9304582556291173, "ground_truth": 0}, {"key": "32325454", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9202179898876355, "ground_truth": 0}, {"key": "38395319", "model": "llama", "target_model": "llama", "recognition_score": 0.8757869762960999, "ground_truth": 1}, {"key": "38395319", "model": "llama", "target_model": "human", "recognition_score": 0.8783142339771935, "ground_truth": 0}, {"key": "38395319", "model": "llama", "target_model": "claude", "recognition_score": 0.8679338454111033, "ground_truth": 0}, {"key": "38395319", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9190632832340765, "ground_truth": 0}, {"key": "38395319", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8311430253075324, "ground_truth": 0}, {"key": "38235895", "model": "llama", "target_model": "llama", "recognition_score": 0.45713674034529755, "ground_truth": 1}, {"key": "38235895", "model": "llama", "target_model": "human", "recognition_score": 0.513668446114497, "ground_truth": 0}, {"key": "38235895", "model": "llama", "target_model": "claude", "recognition_score": 0.5175708889327385, "ground_truth": 0}, {"key": "38235895", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5467381369825676, "ground_truth": 0}, {"key": "38235895", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6808786157422567, "ground_truth": 0}, {"key": "26543267", "model": "llama", "target_model": "llama", "recognition_score": 0.795658119403689, "ground_truth": 1}, {"key": "26543267", "model": "llama", "target_model": "human", "recognition_score": 0.724870290335485, "ground_truth": 0}, {"key": "26543267", "model": "llama", "target_model": "claude", "recognition_score": 0.6424324827752049, "ground_truth": 0}, {"key": "26543267", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7233094656861985, "ground_truth": 0}, {"key": "26543267", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6548947134679577, "ground_truth": 0}, {"key": "39054728", "model": "llama", "target_model": "llama", "recognition_score": 0.9875683492091227, "ground_truth": 1}, {"key": "39054728", "model": "llama", "target_model": "human", "recognition_score": 0.9853843304476047, "ground_truth": 0}, {"key": "39054728", "model": "llama", "target_model": "claude", "recognition_score": 0.9742394402314162, "ground_truth": 0}, {"key": "39054728", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9842154393438393, "ground_truth": 0}, {"key": "39054728", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9894295121837667, "ground_truth": 0}, {"key": "39158443", "model": "llama", "target_model": "llama", "recognition_score": 0.882427870100491, "ground_truth": 1}, {"key": "39158443", "model": "llama", "target_model": "human", "recognition_score": 0.9385759603103737, "ground_truth": 0}, {"key": "39158443", "model": "llama", "target_model": "claude", "recognition_score": 0.8529354858136813, "ground_truth": 0}, {"key": "39158443", "model": "llama", "target_model": "gpt4", "recognition_score": 0.92840879440383, "ground_truth": 0}, {"key": "39158443", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9314625052286214, "ground_truth": 0}, {"key": "36254201", "model": "llama", "target_model": "llama", "recognition_score": 0.40733338936341, "ground_truth": 1}, {"key": "36254201", "model": "llama", "target_model": "human", "recognition_score": 0.35398628268441207, "ground_truth": 0}, {"key": "36254201", "model": "llama", "target_model": "claude", "recognition_score": 0.5525396965339551, "ground_truth": 0}, {"key": "36254201", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4301473146293366, "ground_truth": 0}, {"key": "36254201", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5888891357866378, "ground_truth": 0}, {"key": "23434347", "model": "llama", "target_model": "llama", "recognition_score": 0.8469578249300255, "ground_truth": 1}, {"key": "23434347", "model": "llama", "target_model": "human", "recognition_score": 0.4551986072296152, "ground_truth": 0}, {"key": "23434347", "model": "llama", "target_model": "claude", "recognition_score": 0.8354835176308792, "ground_truth": 0}, {"key": "23434347", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7446563374612747, "ground_truth": 0}, {"key": "23434347", "model": "llama", "target_model": "gpt35", "recognition_score": 0.849971179011304, "ground_truth": 0}, {"key": "34397620", "model": "llama", "target_model": "llama", "recognition_score": 0.5869964526812995, "ground_truth": 1}, {"key": "34397620", "model": "llama", "target_model": "human", "recognition_score": 0.5640985126596035, "ground_truth": 0}, {"key": "34397620", "model": "llama", "target_model": "claude", "recognition_score": 0.5136684737382334, "ground_truth": 0}, {"key": "34397620", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5389832283760864, "ground_truth": 0}, {"key": "34397620", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5907792033815579, "ground_truth": 0}, {"key": "34340916", "model": "llama", "target_model": "llama", "recognition_score": 0.8864204082656219, "ground_truth": 1}, {"key": "34340916", "model": "llama", "target_model": "human", "recognition_score": 0.5583269752038992, "ground_truth": 0}, {"key": "34340916", "model": "llama", "target_model": "claude", "recognition_score": 0.8068526080437924, "ground_truth": 0}, {"key": "34340916", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8489721919235611, "ground_truth": 0}, {"key": "34340916", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7476159489965165, "ground_truth": 0}, {"key": "30375089", "model": "llama", "target_model": "llama", "recognition_score": 0.8705972654569528, "ground_truth": 1}, {"key": "30375089", "model": "llama", "target_model": "human", "recognition_score": 0.8311430484230392, "ground_truth": 0}, {"key": "30375089", "model": "llama", "target_model": "claude", "recognition_score": 0.8221891266068568, "ground_truth": 0}, {"key": "30375089", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7745833787780553, "ground_truth": 0}, {"key": "30375089", "model": "llama", "target_model": "gpt35", "recognition_score": 0.866132518258377, "ground_truth": 0}, {"key": "35807797", "model": "llama", "target_model": "llama", "recognition_score": 0.9079671439915946, "ground_truth": 1}, {"key": "35807797", "model": "llama", "target_model": "human", "recognition_score": 0.7446563408375586, "ground_truth": 0}, {"key": "35807797", "model": "llama", "target_model": "claude", "recognition_score": 0.9105453944597883, "ground_truth": 0}, {"key": "35807797", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8925625162983862, "ground_truth": 0}, {"key": "35807797", "model": "llama", "target_model": "gpt35", "recognition_score": 0.94334757256712, "ground_truth": 0}, {"key": "34188172", "model": "llama", "target_model": "llama", "recognition_score": 0.8947894549186767, "ground_truth": 1}, {"key": "34188172", "model": "llama", "target_model": "human", "recognition_score": 0.7122321689728646, "ground_truth": 0}, {"key": "34188172", "model": "llama", "target_model": "claude", "recognition_score": 0.8539127672747031, "ground_truth": 0}, {"key": "34188172", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8856314823084489, "ground_truth": 0}, {"key": "34188172", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7577943543638522, "ground_truth": 0}, {"key": "37075567", "model": "llama", "target_model": "llama", "recognition_score": 0.968141143097386, "ground_truth": 1}, {"key": "37075567", "model": "llama", "target_model": "human", "recognition_score": 0.9706877703841184, "ground_truth": 0}, {"key": "37075567", "model": "llama", "target_model": "claude", "recognition_score": 0.9734434314011153, "ground_truth": 0}, {"key": "37075567", "model": "llama", "target_model": "gpt4", "recognition_score": 0.95077788968945, "ground_truth": 0}, {"key": "37075567", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9648551542998881, "ground_truth": 0}, {"key": "35559735", "model": "llama", "target_model": "llama", "recognition_score": 0.8705972700647765, "ground_truth": 1}, {"key": "35559735", "model": "llama", "target_model": "human", "recognition_score": 0.8933094089822021, "ground_truth": 0}, {"key": "35559735", "model": "llama", "target_model": "claude", "recognition_score": 0.8128673198002857, "ground_truth": 0}, {"key": "35559735", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9161096055052506, "ground_truth": 0}, {"key": "35559735", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9073122263320506, "ground_truth": 0}, {"key": "33005019", "model": "llama", "target_model": "llama", "recognition_score": 0.6791786828743342, "ground_truth": 1}, {"key": "33005019", "model": "llama", "target_model": "human", "recognition_score": 0.5234203544007505, "ground_truth": 0}, {"key": "33005019", "model": "llama", "target_model": "claude", "recognition_score": 0.8397339625820622, "ground_truth": 0}, {"key": "33005019", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8606036191331649, "ground_truth": 0}, {"key": "33005019", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8577681131994812, "ground_truth": 0}, {"key": "30808252", "model": "llama", "target_model": "llama", "recognition_score": 0.654894715210702, "ground_truth": 1}, {"key": "30808252", "model": "llama", "target_model": "human", "recognition_score": 0.7634837698582357, "ground_truth": 0}, {"key": "30808252", "model": "llama", "target_model": "claude", "recognition_score": 0.6548947355233911, "ground_truth": 0}, {"key": "30808252", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7401743676890937, "ground_truth": 0}, {"key": "30808252", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6076631822932531, "ground_truth": 0}, {"key": "15159017", "model": "llama", "target_model": "llama", "recognition_score": 0.8688267860841163, "ground_truth": 1}, {"key": "15159017", "model": "llama", "target_model": "human", "recognition_score": 0.9026095995115333, "ground_truth": 0}, {"key": "15159017", "model": "llama", "target_model": "claude", "recognition_score": 0.8969755679608504, "ground_truth": 0}, {"key": "15159017", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9105453911456819, "ground_truth": 0}, {"key": "15159017", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8940517125293953, "ground_truth": 0}, {"key": "24493400", "model": "llama", "target_model": "llama", "recognition_score": 0.4824290822670282, "ground_truth": 1}, {"key": "24493400", "model": "llama", "target_model": "human", "recognition_score": 0.6206216249091863, "ground_truth": 0}, {"key": "24493400", "model": "llama", "target_model": "claude", "recognition_score": 0.6636689500783056, "ground_truth": 0}, {"key": "24493400", "model": "llama", "target_model": "gpt4", "recognition_score": 0.537041372861368, "ground_truth": 0}, {"key": "24493400", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6825737299080602, "ground_truth": 0}, {"key": "37791071", "model": "llama", "target_model": "llama", "recognition_score": 0.8128673159390792, "ground_truth": 1}, {"key": "37791071", "model": "llama", "target_model": "human", "recognition_score": 0.8732148295478667, "ground_truth": 0}, {"key": "37791071", "model": "llama", "target_model": "claude", "recognition_score": 0.9594592623151882, "ground_truth": 0}, {"key": "37791071", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9615338046102205, "ground_truth": 0}, {"key": "37791071", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9536218006612981, "ground_truth": 0}, {"key": "33528627", "model": "llama", "target_model": "llama", "recognition_score": 0.9621075768479167, "ground_truth": 1}, {"key": "33528627", "model": "llama", "target_model": "human", "recognition_score": 0.8175745019212848, "ground_truth": 0}, {"key": "33528627", "model": "llama", "target_model": "claude", "recognition_score": 0.9343951655565611, "ground_truth": 0}, {"key": "33528627", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8633916119768226, "ground_truth": 0}, {"key": "33528627", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9235923093382924, "ground_truth": 0}, {"key": "39925662", "model": "llama", "target_model": "llama", "recognition_score": 0.9196425266961034, "ground_truth": 1}, {"key": "39925662", "model": "llama", "target_model": "human", "recognition_score": 0.948917265817648, "ground_truth": 0}, {"key": "39925662", "model": "llama", "target_model": "claude", "recognition_score": 0.9465966625507712, "ground_truth": 0}, {"key": "39925662", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9585377231475614, "ground_truth": 0}, {"key": "39925662", "model": "llama", "target_model": "gpt35", "recognition_score": 0.928408792532324, "ground_truth": 0}, {"key": "29213416", "model": "llama", "target_model": "llama", "recognition_score": 0.6531269011990343, "ground_truth": 1}, {"key": "29213416", "model": "llama", "target_model": "human", "recognition_score": 0.5506073643975087, "ground_truth": 0}, {"key": "29213416", "model": "llama", "target_model": "claude", "recognition_score": 0.5136684894123764, "ground_truth": 0}, {"key": "29213416", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7325918465703608, "ground_truth": 0}, {"key": "29213416", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5907791976317086, "ground_truth": 0}, {"key": "34492745", "model": "llama", "target_model": "llama", "recognition_score": 0.6548947136738198, "ground_truth": 1}, {"key": "34492745", "model": "llama", "target_model": "human", "recognition_score": 0.4148988365421271, "ground_truth": 0}, {"key": "34492745", "model": "llama", "target_model": "claude", "recognition_score": 0.682573746136637, "ground_truth": 0}, {"key": "34492745", "model": "llama", "target_model": "gpt4", "recognition_score": 0.812867314977832, "ground_truth": 0}, {"key": "34492745", "model": "llama", "target_model": "gpt35", "recognition_score": 0.789233692078881, "ground_truth": 0}, {"key": "34191937", "model": "llama", "target_model": "llama", "recognition_score": 0.8044059236602973, "ground_truth": 1}, {"key": "34191937", "model": "llama", "target_model": "human", "recognition_score": 0.5156199292826947, "ground_truth": 0}, {"key": "34191937", "model": "llama", "target_model": "claude", "recognition_score": 0.6601723730550975, "ground_truth": 0}, {"key": "34191937", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7461389984672671, "ground_truth": 0}, {"key": "34191937", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6315942949197969, "ground_truth": 0}, {"key": "34933372", "model": "llama", "target_model": "llama", "recognition_score": 0.9219218334062731, "ground_truth": 1}, {"key": "34933372", "model": "llama", "target_model": "human", "recognition_score": 0.8714748700274867, "ground_truth": 0}, {"key": "34933372", "model": "llama", "target_model": "claude", "recognition_score": 0.8529354922719364, "ground_truth": 0}, {"key": "34933372", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8606036121891197, "ground_truth": 0}, {"key": "34933372", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9334308093689122, "ground_truth": 0}, {"key": "38714379", "model": "llama", "target_model": "llama", "recognition_score": 0.9724147181116679, "ground_truth": 1}, {"key": "38714379", "model": "llama", "target_model": "human", "recognition_score": 0.9615338102910386, "ground_truth": 0}, {"key": "38714379", "model": "llama", "target_model": "claude", "recognition_score": 0.9273632900698711, "ground_truth": 0}, {"key": "38714379", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9697854093988019, "ground_truth": 0}, {"key": "38714379", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9728307680797179, "ground_truth": 0}, {"key": "39220660", "model": "llama", "target_model": "llama", "recognition_score": 0.8397339601610798, "ground_truth": 1}, {"key": "39220660", "model": "llama", "target_model": "human", "recognition_score": 0.9246876965589171, "ground_truth": 0}, {"key": "39220660", "model": "llama", "target_model": "claude", "recognition_score": 0.9420819067047768, "ground_truth": 0}, {"key": "39220660", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9522199303274357, "ground_truth": 0}, {"key": "39220660", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8940517067186835, "ground_truth": 0}, {"key": "41028780", "model": "llama", "target_model": "llama", "recognition_score": 0.8840392841939779, "ground_truth": 1}, {"key": "41028780", "model": "llama", "target_model": "human", "recognition_score": 0.8969755657507426, "ground_truth": 0}, {"key": "41028780", "model": "llama", "target_model": "claude", "recognition_score": 0.8633916162237288, "ground_truth": 0}, {"key": "41028780", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8624675348600412, "ground_truth": 0}, {"key": "41028780", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8489722198028761, "ground_truth": 0}, {"key": "39457108", "model": "llama", "target_model": "llama", "recognition_score": 0.7008948187670647, "ground_truth": 1}, {"key": "39457108", "model": "llama", "target_model": "human", "recognition_score": 0.6039318365065534, "ground_truth": 0}, {"key": "39457108", "model": "llama", "target_model": "claude", "recognition_score": 0.7416740344741342, "ground_truth": 0}, {"key": "39457108", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7718434894589444, "ground_truth": 0}, {"key": "39457108", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8031738152495859, "ground_truth": 0}, {"key": "38288018", "model": "llama", "target_model": "llama", "recognition_score": 0.09947021370989567, "ground_truth": 1}, {"key": "38288018", "model": "llama", "target_model": "human", "recognition_score": 0.16238002991439113, "ground_truth": 0}, {"key": "38288018", "model": "llama", "target_model": "claude", "recognition_score": 0.17217185454680273, "ground_truth": 0}, {"key": "38288018", "model": "llama", "target_model": "gpt4", "recognition_score": 0.2766905245123932, "ground_truth": 0}, {"key": "38288018", "model": "llama", "target_model": "gpt35", "recognition_score": 0.18476751142692344, "ground_truth": 0}, {"key": "40106293", "model": "llama", "target_model": "llama", "recognition_score": 0.3073580170084769, "ground_truth": 1}, {"key": "40106293", "model": "llama", "target_model": "human", "recognition_score": 0.4571367349286053, "ground_truth": 0}, {"key": "40106293", "model": "llama", "target_model": "claude", "recognition_score": 0.5175708944121724, "ground_truth": 0}, {"key": "40106293", "model": "llama", "target_model": "gpt4", "recognition_score": 0.27982849433003315, "ground_truth": 0}, {"key": "40106293", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4263215911202563, "ground_truth": 0}, {"key": "39948797", "model": "llama", "target_model": "llama", "recognition_score": 0.8791467574003559, "ground_truth": 1}, {"key": "39948797", "model": "llama", "target_model": "human", "recognition_score": 0.9429286010733902, "ground_truth": 0}, {"key": "39948797", "model": "llama", "target_model": "claude", "recognition_score": 0.8749346100560486, "ground_truth": 0}, {"key": "39948797", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9086178960792433, "ground_truth": 0}, {"key": "39948797", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9032942003370935, "ground_truth": 0}, {"key": "31853399", "model": "llama", "target_model": "llama", "recognition_score": 0.9477691449584815, "ground_truth": 1}, {"key": "31853399", "model": "llama", "target_model": "human", "recognition_score": 0.9026095958832615, "ground_truth": 0}, {"key": "31853399", "model": "llama", "target_model": "claude", "recognition_score": 0.9230391695276775, "ground_truth": 0}, {"key": "31853399", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9309620778077504, "ground_truth": 0}, {"key": "31853399", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9594592615495239, "ground_truth": 0}, {"key": "35273252", "model": "llama", "target_model": "llama", "recognition_score": 0.33285230920771713, "ground_truth": 1}, {"key": "35273252", "model": "llama", "target_model": "human", "recognition_score": 0.700894813692672, "ground_truth": 0}, {"key": "35273252", "model": "llama", "target_model": "claude", "recognition_score": 0.4882834018562492, "ground_truth": 0}, {"key": "35273252", "model": "llama", "target_model": "gpt4", "recognition_score": 0.4707365841009679, "ground_truth": 0}, {"key": "35273252", "model": "llama", "target_model": "gpt35", "recognition_score": 0.24508501992869267, "ground_truth": 0}, {"key": "37130459", "model": "llama", "target_model": "llama", "recognition_score": 0.9661559634412618, "ground_truth": 1}, {"key": "37130459", "model": "llama", "target_model": "human", "recognition_score": 0.9850429136439153, "ground_truth": 0}, {"key": "37130459", "model": "llama", "target_model": "claude", "recognition_score": 0.9635062346392754, "ground_truth": 0}, {"key": "37130459", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9757623652736788, "ground_truth": 0}, {"key": "37130459", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9645892682613425, "ground_truth": 0}, {"key": "21734003", "model": "llama", "target_model": "llama", "recognition_score": 0.8879840505174847, "ground_truth": 1}, {"key": "21734003", "model": "llama", "target_model": "human", "recognition_score": 0.9481545334817223, "ground_truth": 0}, {"key": "21734003", "model": "llama", "target_model": "claude", "recognition_score": 0.9294404024876222, "ground_truth": 0}, {"key": "21734003", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9202179823871317, "ground_truth": 0}, {"key": "21734003", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9079671309809318, "ground_truth": 0}, {"key": "33990737", "model": "llama", "target_model": "llama", "recognition_score": 0.6842640357203517, "ground_truth": 1}, {"key": "33990737", "model": "llama", "target_model": "human", "recognition_score": 0.6688802552108378, "ground_truth": 0}, {"key": "33990737", "model": "llama", "target_model": "claude", "recognition_score": 0.7690802468430623, "ground_truth": 0}, {"key": "33990737", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6842640108268846, "ground_truth": 0}, {"key": "33990737", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8056322123391051, "ground_truth": 0}, {"key": "34559912", "model": "llama", "target_model": "llama", "recognition_score": 0.8955226719620286, "ground_truth": 1}, {"key": "34559912", "model": "llama", "target_model": "human", "recognition_score": 0.9278877873575897, "ground_truth": 0}, {"key": "34559912", "model": "llama", "target_model": "claude", "recognition_score": 0.9329437121690484, "ground_truth": 0}, {"key": "34559912", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8697145844504941, "ground_truth": 0}, {"key": "34559912", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9155072434777025, "ground_truth": 0}, {"key": "39820439", "model": "llama", "target_model": "llama", "recognition_score": 0.31573596031723683, "ground_truth": 1}, {"key": "39820439", "model": "llama", "target_model": "human", "recognition_score": 0.4263215699264888, "ground_truth": 0}, {"key": "39820439", "model": "llama", "target_model": "claude", "recognition_score": 0.550607381538942, "ground_truth": 0}, {"key": "39820439", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3276683143402195, "ground_truth": 0}, {"key": "39820439", "model": "llama", "target_model": "gpt35", "recognition_score": 0.29746993820951867, "ground_truth": 0}, {"key": "34759328", "model": "llama", "target_model": "llama", "recognition_score": 0.9381240122796715, "ground_truth": 1}, {"key": "34759328", "model": "llama", "target_model": "human", "recognition_score": 0.9782188288800573, "ground_truth": 0}, {"key": "34759328", "model": "llama", "target_model": "claude", "recognition_score": 0.9635062322899443, "ground_truth": 0}, {"key": "34759328", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9795114463949746, "ground_truth": 0}, {"key": "34759328", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9861513891084247, "ground_truth": 0}, {"key": "36939137", "model": "llama", "target_model": "llama", "recognition_score": 0.8723473804694714, "ground_truth": 1}, {"key": "36939137", "model": "llama", "target_model": "human", "recognition_score": 0.830043766882903, "ground_truth": 0}, {"key": "36939137", "model": "llama", "target_model": "claude", "recognition_score": 0.7799929071953116, "ground_truth": 0}, {"key": "36939137", "model": "llama", "target_model": "gpt4", "recognition_score": 0.955651419761453, "ground_truth": 0}, {"key": "36939137", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8807970764760632, "ground_truth": 0}, {"key": "35851522", "model": "llama", "target_model": "llama", "recognition_score": 0.8449215387172384, "ground_truth": 1}, {"key": "35851522", "model": "llama", "target_model": "human", "recognition_score": 0.8519528244852933, "ground_truth": 0}, {"key": "35851522", "model": "llama", "target_model": "claude", "recognition_score": 0.8848377764495485, "ground_truth": 0}, {"key": "35851522", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8799743748576628, "ground_truth": 0}, {"key": "35851522", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7732163486292802, "ground_truth": 0}, {"key": "22412782", "model": "llama", "target_model": "llama", "recognition_score": 0.8068526295002886, "ground_truth": 1}, {"key": "22412782", "model": "llama", "target_model": "human", "recognition_score": 0.8300437685358837, "ground_truth": 0}, {"key": "22412782", "model": "llama", "target_model": "claude", "recognition_score": 0.8984105513655121, "ground_truth": 0}, {"key": "22412782", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7446563338967515, "ground_truth": 0}, {"key": "22412782", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8774767856535031, "ground_truth": 0}, {"key": "38579227", "model": "llama", "target_model": "llama", "recognition_score": 0.9612438067340318, "ground_truth": 1}, {"key": "38579227", "model": "llama", "target_model": "human", "recognition_score": 0.9385759625084509, "ground_truth": 0}, {"key": "38579227", "model": "llama", "target_model": "claude", "recognition_score": 0.8879840513709352, "ground_truth": 0}, {"key": "38579227", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9713473307813314, "ground_truth": 0}, {"key": "38579227", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9635062336115037, "ground_truth": 0}, {"key": "37206995", "model": "llama", "target_model": "llama", "recognition_score": 0.8816149095340081, "ground_truth": 1}, {"key": "37206995", "model": "llama", "target_model": "human", "recognition_score": 0.9289263286905027, "ground_truth": 0}, {"key": "37206995", "model": "llama", "target_model": "claude", "recognition_score": 0.887984056695292, "ground_truth": 0}, {"key": "37206995", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8887587939968217, "ground_truth": 0}, {"key": "37206995", "model": "llama", "target_model": "gpt35", "recognition_score": 0.840782602884086, "ground_truth": 0}, {"key": "38700847", "model": "llama", "target_model": "llama", "recognition_score": 0.8697145885681379, "ground_truth": 1}, {"key": "38700847", "model": "llama", "target_model": "human", "recognition_score": 0.9005297919509779, "ground_truth": 0}, {"key": "38700847", "model": "llama", "target_model": "claude", "recognition_score": 0.8791467805420204, "ground_truth": 0}, {"key": "38700847", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8568122887430542, "ground_truth": 0}, {"key": "38700847", "model": "llama", "target_model": "gpt35", "recognition_score": 0.773216368881061, "ground_truth": 0}, {"key": "20246590", "model": "llama", "target_model": "llama", "recognition_score": 0.9791955078419946, "ground_truth": 1}, {"key": "20246590", "model": "llama", "target_model": "human", "recognition_score": 0.993202468120519, "ground_truth": 0}, {"key": "20246590", "model": "llama", "target_model": "claude", "recognition_score": 0.9830850880774397, "ground_truth": 0}, {"key": "20246590", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9843363514137747, "ground_truth": 0}, {"key": "20246590", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9843363513400922, "ground_truth": 0}, {"key": "39141360", "model": "llama", "target_model": "llama", "recognition_score": 0.9362850033495379, "ground_truth": 1}, {"key": "39141360", "model": "llama", "target_model": "human", "recognition_score": 0.8344068900603087, "ground_truth": 0}, {"key": "39141360", "model": "llama", "target_model": "claude", "recognition_score": 0.8807970713952489, "ground_truth": 0}, {"key": "39141360", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8955226758845451, "ground_truth": 0}, {"key": "39141360", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8984105596759263, "ground_truth": 0}, {"key": "37906226", "model": "llama", "target_model": "llama", "recognition_score": 0.7279754651555123, "ground_truth": 1}, {"key": "37906226", "model": "llama", "target_model": "human", "recognition_score": 0.7008948003201346, "ground_truth": 0}, {"key": "37906226", "model": "llama", "target_model": "claude", "recognition_score": 0.5312093662994288, "ground_truth": 0}, {"key": "37906226", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6460136872686336, "ground_truth": 0}, {"key": "37906226", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6842640172045451, "ground_truth": 0}, {"key": "16201033", "model": "llama", "target_model": "llama", "recognition_score": 0.8479677548192522, "ground_truth": 1}, {"key": "16201033", "model": "llama", "target_model": "human", "recognition_score": 0.8783142429353588, "ground_truth": 0}, {"key": "16201033", "model": "llama", "target_model": "claude", "recognition_score": 0.921357613889423, "ground_truth": 0}, {"key": "16201033", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8615382095900324, "ground_truth": 0}, {"key": "16201033", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8140528022878907, "ground_truth": 0}, {"key": "36469022", "model": "llama", "target_model": "llama", "recognition_score": 0.7505527604778188, "ground_truth": 1}, {"key": "36469022", "model": "llama", "target_model": "human", "recognition_score": 0.5506073775127077, "ground_truth": 0}, {"key": "36469022", "model": "llama", "target_model": "claude", "recognition_score": 0.6706082729426165, "ground_truth": 0}, {"key": "36469022", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8116760188554174, "ground_truth": 0}, {"key": "36469022", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5660185340454091, "ground_truth": 0}, {"key": "31295270", "model": "llama", "target_model": "llama", "recognition_score": 0.26435836012284775, "ground_truth": 1}, {"key": "31295270", "model": "llama", "target_model": "human", "recognition_score": 0.32423540281173074, "ground_truth": 0}, {"key": "31295270", "model": "llama", "target_model": "claude", "recognition_score": 0.1451153626462114, "ground_truth": 0}, {"key": "31295270", "model": "llama", "target_model": "gpt4", "recognition_score": 0.36296920997352544, "ground_truth": 0}, {"key": "31295270", "model": "llama", "target_model": "gpt35", "recognition_score": 0.2538609980202233, "ground_truth": 0}, {"key": "35360689", "model": "llama", "target_model": "llama", "recognition_score": 0.6370307729541204, "ground_truth": 1}, {"key": "35360689", "model": "llama", "target_model": "human", "recognition_score": 0.5292633896823885, "ground_truth": 0}, {"key": "35360689", "model": "llama", "target_model": "claude", "recognition_score": 0.46490155879861933, "ground_truth": 0}, {"key": "35360689", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3575675483233045, "ground_truth": 0}, {"key": "35360689", "model": "llama", "target_model": "gpt35", "recognition_score": 0.45132649889021254, "ground_truth": 0}, {"key": "29202793", "model": "llama", "target_model": "llama", "recognition_score": 0.5312093898393933, "ground_truth": 1}, {"key": "29202793", "model": "llama", "target_model": "human", "recognition_score": 0.3998116257923887, "ground_truth": 0}, {"key": "29202793", "model": "llama", "target_model": "claude", "recognition_score": 0.5467381549265111, "ground_truth": 0}, {"key": "29202793", "model": "llama", "target_model": "gpt4", "recognition_score": 0.30569732249826154, "ground_truth": 0}, {"key": "29202793", "model": "llama", "target_model": "gpt35", "recognition_score": 0.49023565125393487, "ground_truth": 0}, {"key": "35999008", "model": "llama", "target_model": "llama", "recognition_score": 0.6808786054522009, "ground_truth": 1}, {"key": "35999008", "model": "llama", "target_model": "human", "recognition_score": 0.43206339566868823, "ground_truth": 0}, {"key": "35999008", "model": "llama", "target_model": "claude", "recognition_score": 0.7310586085074422, "ground_truth": 0}, {"key": "35999008", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7386690560006005, "ground_truth": 0}, {"key": "35999008", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8311430428669693, "ground_truth": 0}, {"key": "31797119", "model": "llama", "target_model": "llama", "recognition_score": 0.9026095943335095, "ground_truth": 1}, {"key": "31797119", "model": "llama", "target_model": "human", "recognition_score": 0.7943849515563397, "ground_truth": 0}, {"key": "31797119", "model": "llama", "target_model": "claude", "recognition_score": 0.9066531169602603, "ground_truth": 0}, {"key": "31797119", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8998277771457477, "ground_truth": 0}, {"key": "31797119", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8407825877256752, "ground_truth": 0}, {"key": "26711893", "model": "llama", "target_model": "llama", "recognition_score": 0.7879312109480427, "ground_truth": 1}, {"key": "26711893", "model": "llama", "target_model": "human", "recognition_score": 0.7662936599617293, "ground_truth": 0}, {"key": "26711893", "model": "llama", "target_model": "claude", "recognition_score": 0.8044059062720453, "ground_truth": 0}, {"key": "26711893", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7057850235164148, "ground_truth": 0}, {"key": "26711893", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6992544066215857, "ground_truth": 0}, {"key": "35348288", "model": "llama", "target_model": "llama", "recognition_score": 0.5486734558067186, "ground_truth": 1}, {"key": "35348288", "model": "llama", "target_model": "human", "recognition_score": 0.5563995492784641, "ground_truth": 0}, {"key": "35348288", "model": "llama", "target_model": "claude", "recognition_score": 0.4130035553222369, "ground_truth": 0}, {"key": "35348288", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6959583151057354, "ground_truth": 0}, {"key": "35348288", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6242935370329055, "ground_truth": 0}, {"key": "38124131", "model": "llama", "target_model": "llama", "recognition_score": 0.20055767361148416, "ground_truth": 1}, {"key": "38124131", "model": "llama", "target_model": "human", "recognition_score": 0.1895211041740008, "ground_truth": 0}, {"key": "38124131", "model": "llama", "target_model": "claude", "recognition_score": 0.42059959112554907, "ground_truth": 0}, {"key": "38124131", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3539863177479662, "ground_truth": 0}, {"key": "38124131", "model": "llama", "target_model": "gpt35", "recognition_score": 0.36296919957311535, "ground_truth": 0}, {"key": "20285901", "model": "llama", "target_model": "llama", "recognition_score": 0.8376199857151232, "ground_truth": 1}, {"key": "20285901", "model": "llama", "target_model": "human", "recognition_score": 0.8438951000373534, "ground_truth": 0}, {"key": "20285901", "model": "llama", "target_model": "claude", "recognition_score": 0.8116760211746853, "ground_truth": 0}, {"key": "20285901", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9092645064983159, "ground_truth": 0}, {"key": "20285901", "model": "llama", "target_model": "gpt35", "recognition_score": 0.825589726696874, "ground_truth": 0}, {"key": "35633632", "model": "llama", "target_model": "llama", "recognition_score": 0.8509646941538791, "ground_truth": 1}, {"key": "35633632", "model": "llama", "target_model": "human", "recognition_score": 0.7264255988664654, "ground_truth": 0}, {"key": "35633632", "model": "llama", "target_model": "claude", "recognition_score": 0.7745833941911541, "ground_truth": 0}, {"key": "35633632", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8365545656715905, "ground_truth": 0}, {"key": "35633632", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9111797057651762, "ground_truth": 0}, {"key": "10741274", "model": "llama", "target_model": "llama", "recognition_score": 0.6859494685972058, "ground_truth": 1}, {"key": "10741274", "model": "llama", "target_model": "human", "recognition_score": 0.5448014130558293, "ground_truth": 0}, {"key": "10741274", "model": "llama", "target_model": "claude", "recognition_score": 0.5736784174083824, "ground_truth": 0}, {"key": "10741274", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5660185434433977, "ground_truth": 0}, {"key": "10741274", "model": "llama", "target_model": "gpt35", "recognition_score": 0.39233681718470365, "ground_truth": 0}, {"key": "30605795", "model": "llama", "target_model": "llama", "recognition_score": 0.8558511463918553, "ground_truth": 1}, {"key": "30605795", "model": "llama", "target_model": "human", "recognition_score": 0.7866228379517588, "ground_truth": 0}, {"key": "30605795", "model": "llama", "target_model": "claude", "recognition_score": 0.7563575594756811, "ground_truth": 0}, {"key": "30605795", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8848377618101769, "ground_truth": 0}, {"key": "30605795", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7956580914137769, "ground_truth": 0}, {"key": "30539722", "model": "llama", "target_model": "llama", "recognition_score": 0.8152324895960317, "ground_truth": 1}, {"key": "30539722", "model": "llama", "target_model": "human", "recognition_score": 0.6113819826514963, "ground_truth": 0}, {"key": "30539722", "model": "llama", "target_model": "claude", "recognition_score": 0.8925625232171531, "ground_truth": 0}, {"key": "30539722", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8633916007666224, "ground_truth": 0}, {"key": "30539722", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8233284045379157, "ground_truth": 0}, {"key": "18639299", "model": "llama", "target_model": "llama", "recognition_score": 0.3557748859892262, "ground_truth": 1}, {"key": "18639299", "model": "llama", "target_model": "human", "recognition_score": 0.23651623282997586, "ground_truth": 0}, {"key": "18639299", "model": "llama", "target_model": "claude", "recognition_score": 0.1955940853555394, "ground_truth": 0}, {"key": "18639299", "model": "llama", "target_model": "gpt4", "recognition_score": 0.24220562980547092, "ground_truth": 0}, {"key": "18639299", "model": "llama", "target_model": "gpt35", "recognition_score": 0.16238002847425248, "ground_truth": 0}, {"key": "39773552", "model": "llama", "target_model": "llama", "recognition_score": 0.8596637559811949, "ground_truth": 1}, {"key": "39773552", "model": "llama", "target_model": "human", "recognition_score": 0.8539127620590887, "ground_truth": 0}, {"key": "39773552", "model": "llama", "target_model": "claude", "recognition_score": 0.6706082822485426, "ground_truth": 0}, {"key": "39773552", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7248702570086551, "ground_truth": 0}, {"key": "39773552", "model": "llama", "target_model": "gpt35", "recognition_score": 0.723309473370052, "ground_truth": 0}, {"key": "34086410", "model": "llama", "target_model": "llama", "recognition_score": 0.7534666573715537, "ground_truth": 1}, {"key": "34086410", "model": "llama", "target_model": "human", "recognition_score": 0.5136684660807203, "ground_truth": 0}, {"key": "34086410", "model": "llama", "target_model": "claude", "recognition_score": 0.5983121530403185, "ground_truth": 0}, {"key": "34086410", "model": "llama", "target_model": "gpt4", "recognition_score": 0.42059961698557424, "ground_truth": 0}, {"key": "34086410", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7264256282366387, "ground_truth": 0}, {"key": "35454652", "model": "llama", "target_model": "llama", "recognition_score": 0.7994423249738041, "ground_truth": 1}, {"key": "35454652", "model": "llama", "target_model": "human", "recognition_score": 0.9079671459903038, "ground_truth": 0}, {"key": "35454652", "model": "llama", "target_model": "claude", "recognition_score": 0.8940517153439365, "ground_truth": 0}, {"key": "35454652", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8661325233432478, "ground_truth": 0}, {"key": "35454652", "model": "llama", "target_model": "gpt35", "recognition_score": 0.932453304242117, "ground_truth": 0}, {"key": "36158310", "model": "llama", "target_model": "llama", "recognition_score": 0.9309620687162802, "ground_truth": 1}, {"key": "36158310", "model": "llama", "target_model": "human", "recognition_score": 0.6740504956949316, "ground_truth": 0}, {"key": "36158310", "model": "llama", "target_model": "claude", "recognition_score": 0.9481545363051025, "ground_truth": 0}, {"key": "36158310", "model": "llama", "target_model": "gpt4", "recognition_score": 0.903294205378511, "ground_truth": 0}, {"key": "36158310", "model": "llama", "target_model": "gpt35", "recognition_score": 0.833324583685284, "ground_truth": 0}, {"key": "35688387", "model": "llama", "target_model": "llama", "recognition_score": 0.4320633835077725, "ground_truth": 1}, {"key": "35688387", "model": "llama", "target_model": "human", "recognition_score": 0.853912758453587, "ground_truth": 0}, {"key": "35688387", "model": "llama", "target_model": "claude", "recognition_score": 0.2909808784052067, "ground_truth": 0}, {"key": "35688387", "model": "llama", "target_model": "gpt4", "recognition_score": 0.47852885960299685, "ground_truth": 0}, {"key": "35688387", "model": "llama", "target_model": "gpt35", "recognition_score": 0.49218812491284814, "ground_truth": 0}, {"key": "34209292", "model": "llama", "target_model": "llama", "recognition_score": 0.9403530519318425, "ground_truth": 1}, {"key": "34209292", "model": "llama", "target_model": "human", "recognition_score": 0.826711777594197, "ground_truth": 0}, {"key": "34209292", "model": "llama", "target_model": "claude", "recognition_score": 0.8418256582782532, "ground_truth": 0}, {"key": "34209292", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9046505326355497, "ground_truth": 0}, {"key": "34209292", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8902942171812653, "ground_truth": 0}, {"key": "25037859", "model": "llama", "target_model": "llama", "recognition_score": 0.6442250830923733, "ground_truth": 1}, {"key": "25037859", "model": "llama", "target_model": "human", "recognition_score": 0.5851011483751993, "ground_truth": 0}, {"key": "25037859", "model": "llama", "target_model": "claude", "recognition_score": 0.560252631647647, "ground_truth": 0}, {"key": "25037859", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7839884838096002, "ground_truth": 0}, {"key": "25037859", "model": "llama", "target_model": "gpt35", "recognition_score": 0.667147660744635, "ground_truth": 0}, {"key": "36412121", "model": "llama", "target_model": "llama", "recognition_score": 0.9299510291877199, "ground_truth": 1}, {"key": "36412121", "model": "llama", "target_model": "human", "recognition_score": 0.9358173534199413, "ground_truth": 0}, {"key": "36412121", "model": "llama", "target_model": "claude", "recognition_score": 0.9314625089161044, "ground_truth": 0}, {"key": "36412121", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9515039960389362, "ground_truth": 0}, {"key": "36412121", "model": "llama", "target_model": "gpt35", "recognition_score": 0.891054956414337, "ground_truth": 0}, {"key": "34909172", "model": "llama", "target_model": "llama", "recognition_score": 0.8864204080347406, "ground_truth": 1}, {"key": "34909172", "model": "llama", "target_model": "human", "recognition_score": 0.9046505257824986, "ground_truth": 0}, {"key": "34909172", "model": "llama", "target_model": "claude", "recognition_score": 0.8044059276512338, "ground_truth": 0}, {"key": "34909172", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9348724574533858, "ground_truth": 0}, {"key": "34909172", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8386797780095983, "ground_truth": 0}, {"key": "39011806", "model": "llama", "target_model": "llama", "recognition_score": 0.8969755687941116, "ground_truth": 1}, {"key": "39011806", "model": "llama", "target_model": "human", "recognition_score": 0.822189132646189, "ground_truth": 0}, {"key": "39011806", "model": "llama", "target_model": "claude", "recognition_score": 0.8705972752879693, "ground_truth": 0}, {"key": "39011806", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8233283979406815, "ground_truth": 0}, {"key": "39011806", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8354835396925759, "ground_truth": 0}, {"key": "33096163", "model": "llama", "target_model": "llama", "recognition_score": 0.8840392806847276, "ground_truth": 1}, {"key": "33096163", "model": "llama", "target_model": "human", "recognition_score": 0.9289263311417694, "ground_truth": 0}, {"key": "33096163", "model": "llama", "target_model": "claude", "recognition_score": 0.9012274115432753, "ground_truth": 0}, {"key": "33096163", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8749346116685871, "ground_truth": 0}, {"key": "33096163", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9136765197172497, "ground_truth": 0}, {"key": "38762205", "model": "llama", "target_model": "llama", "recognition_score": 0.9429286062471314, "ground_truth": 1}, {"key": "38762205", "model": "llama", "target_model": "human", "recognition_score": 0.9746286898280561, "ground_truth": 0}, {"key": "38762205", "model": "llama", "target_model": "claude", "recognition_score": 0.9079671403917308, "ground_truth": 0}, {"key": "38762205", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9744347838237348, "ground_truth": 0}, {"key": "38762205", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9546474227438345, "ground_truth": 0}, {"key": "35519177", "model": "llama", "target_model": "llama", "recognition_score": 0.8697145793918836, "ground_truth": 1}, {"key": "35519177", "model": "llama", "target_model": "human", "recognition_score": 0.7057850355565172, "ground_truth": 0}, {"key": "35519177", "model": "llama", "target_model": "claude", "recognition_score": 0.9572778031663457, "ground_truth": 0}, {"key": "35519177", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9324533080660722, "ground_truth": 0}, {"key": "35519177", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9416541610272103, "ground_truth": 0}, {"key": "36192531", "model": "llama", "target_model": "llama", "recognition_score": 0.8428631643513883, "ground_truth": 1}, {"key": "36192531", "model": "llama", "target_model": "human", "recognition_score": 0.7264256088261732, "ground_truth": 0}, {"key": "36192531", "model": "llama", "target_model": "claude", "recognition_score": 0.6859494556435174, "ground_truth": 0}, {"key": "36192531", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8092759727606792, "ground_truth": 0}, {"key": "36192531", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9449947116973829, "ground_truth": 0}, {"key": "33160852", "model": "llama", "target_model": "llama", "recognition_score": 0.9433475769630333, "ground_truth": 1}, {"key": "33160852", "model": "llama", "target_model": "human", "recognition_score": 0.8354835229703691, "ground_truth": 0}, {"key": "33160852", "model": "llama", "target_model": "claude", "recognition_score": 0.9173026517531041, "ground_truth": 0}, {"key": "33160852", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9358173565812359, "ground_truth": 0}, {"key": "33160852", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8740772230400234, "ground_truth": 0}, {"key": "36312304", "model": "llama", "target_model": "llama", "recognition_score": 0.6876299849644254, "ground_truth": 1}, {"key": "36312304", "model": "llama", "target_model": "human", "recognition_score": 0.5869964481938977, "ground_truth": 0}, {"key": "36312304", "model": "llama", "target_model": "claude", "recognition_score": 0.5717666017635068, "ground_truth": 0}, {"key": "36312304", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7490872202458398, "ground_truth": 0}, {"key": "36312304", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6095241617147549, "ground_truth": 0}, {"key": "33773343", "model": "llama", "target_model": "llama", "recognition_score": 0.4863315275870731, "ground_truth": 1}, {"key": "33773343", "model": "llama", "target_model": "human", "recognition_score": 0.5428632857381857, "ground_truth": 0}, {"key": "33773343", "model": "llama", "target_model": "claude", "recognition_score": 0.6169358458039379, "ground_truth": 0}, {"key": "33773343", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5717665838634893, "ground_truth": 0}, {"key": "33773343", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5583269988208599, "ground_truth": 0}, {"key": "34913320", "model": "llama", "target_model": "llama", "recognition_score": 0.7839884590535824, "ground_truth": 1}, {"key": "34913320", "model": "llama", "target_model": "human", "recognition_score": 0.8164063740203557, "ground_truth": 0}, {"key": "34913320", "model": "llama", "target_model": "claude", "recognition_score": 0.6723316947995878, "ground_truth": 0}, {"key": "34913320", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7718435151392201, "ground_truth": 0}, {"key": "34913320", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7341195388917672, "ground_truth": 0}, {"key": "33784155", "model": "llama", "target_model": "llama", "recognition_score": 0.8799743802396262, "ground_truth": 1}, {"key": "33784155", "model": "llama", "target_model": "human", "recognition_score": 0.9549844663693356, "ground_truth": 0}, {"key": "33784155", "model": "llama", "target_model": "claude", "recognition_score": 0.8918110445443638, "ground_truth": 0}, {"key": "33784155", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9207896817902724, "ground_truth": 0}, {"key": "33784155", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8438950951951891, "ground_truth": 0}, {"key": "24085062", "model": "llama", "target_model": "llama", "recognition_score": 0.98926483804639, "ground_truth": 1}, {"key": "24085062", "model": "llama", "target_model": "human", "recognition_score": 0.9986006016362267, "ground_truth": 0}, {"key": "24085062", "model": "llama", "target_model": "claude", "recognition_score": 0.9853843290167674, "ground_truth": 0}, {"key": "24085062", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9843363516287078, "ground_truth": 0}, {"key": "24085062", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9764905464445999, "ground_truth": 0}, {"key": "33893487", "model": "llama", "target_model": "llama", "recognition_score": 0.6943026744256319, "ground_truth": 1}, {"key": "33893487", "model": "llama", "target_model": "human", "recognition_score": 0.35220177314406814, "ground_truth": 0}, {"key": "33893487", "model": "llama", "target_model": "claude", "recognition_score": 0.5774953430751654, "ground_truth": 0}, {"key": "33893487", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7520125757430844, "ground_truth": 0}, {"key": "33893487", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4610167659592904, "ground_truth": 0}, {"key": "40913011", "model": "llama", "target_model": "llama", "recognition_score": 0.9196425381510129, "ground_truth": 1}, {"key": "40913011", "model": "llama", "target_model": "human", "recognition_score": 0.9079671378303118, "ground_truth": 0}, {"key": "40913011", "model": "llama", "target_model": "claude", "recognition_score": 0.9353465124711012, "ground_truth": 0}, {"key": "40913011", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9536217958223755, "ground_truth": 0}, {"key": "40913011", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9416541598028642, "ground_truth": 0}, {"key": "29642545", "model": "llama", "target_model": "llama", "recognition_score": 0.6315943034873662, "ground_truth": 1}, {"key": "29642545", "model": "llama", "target_model": "human", "recognition_score": 0.6169358171440261, "ground_truth": 0}, {"key": "29642545", "model": "llama", "target_model": "claude", "recognition_score": 0.5058590910503421, "ground_truth": 0}, {"key": "29642545", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3757064645019174, "ground_truth": 0}, {"key": "29642545", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3433417246677697, "ground_truth": 0}, {"key": "35969159", "model": "llama", "target_model": "llama", "recognition_score": 0.9124361515409817, "ground_truth": 1}, {"key": "35969159", "model": "llama", "target_model": "human", "recognition_score": 0.8925625231385839, "ground_truth": 0}, {"key": "35969159", "model": "llama", "target_model": "claude", "recognition_score": 0.9046505353528645, "ground_truth": 0}, {"key": "35969159", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9073122237315587, "ground_truth": 0}, {"key": "35969159", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8198933464162292, "ground_truth": 0}, {"key": "37081669", "model": "llama", "target_model": "llama", "recognition_score": 0.262841826193042, "ground_truth": 1}, {"key": "37081669", "model": "llama", "target_model": "human", "recognition_score": 0.30404167184706254, "ground_truth": 0}, {"key": "37081669", "model": "llama", "target_model": "claude", "recognition_score": 0.3830641815220787, "ground_truth": 0}, {"key": "37081669", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6548947090861824, "ground_truth": 0}, {"key": "37081669", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6039318431769081, "ground_truth": 0}, {"key": "40048022", "model": "llama", "target_model": "llama", "recognition_score": 0.8933094022247791, "ground_truth": 1}, {"key": "40048022", "model": "llama", "target_model": "human", "recognition_score": 0.8791467571816302, "ground_truth": 0}, {"key": "40048022", "model": "llama", "target_model": "claude", "recognition_score": 0.867035757827712, "ground_truth": 0}, {"key": "40048022", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8670357500309596, "ground_truth": 0}, {"key": "40048022", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8558511439360428, "ground_truth": 0}, {"key": "32884004", "model": "llama", "target_model": "llama", "recognition_score": 0.8969755724500388, "ground_truth": 1}, {"key": "32884004", "model": "llama", "target_model": "human", "recognition_score": 0.9615338074899406, "ground_truth": 0}, {"key": "32884004", "model": "llama", "target_model": "claude", "recognition_score": 0.8056321775615471, "ground_truth": 0}, {"key": "32884004", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9289263266801611, "ground_truth": 0}, {"key": "32884004", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7994423038320027, "ground_truth": 0}, {"key": "39022490", "model": "llama", "target_model": "llama", "recognition_score": 0.9092645201262369, "ground_truth": 1}, {"key": "39022490", "model": "llama", "target_model": "human", "recognition_score": 0.9529258269818887, "ground_truth": 0}, {"key": "39022490", "model": "llama", "target_model": "claude", "recognition_score": 0.8679338485398612, "ground_truth": 0}, {"key": "39022490", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9353465143064151, "ground_truth": 0}, {"key": "39022490", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8940517094729209, "ground_truth": 0}, {"key": "35159385", "model": "llama", "target_model": "llama", "recognition_score": 0.9118099651104086, "ground_truth": 1}, {"key": "35159385", "model": "llama", "target_model": "human", "recognition_score": 0.8940517178915139, "ground_truth": 0}, {"key": "35159385", "model": "llama", "target_model": "claude", "recognition_score": 0.872347386106209, "ground_truth": 0}, {"key": "35159385", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9130583391361649, "ground_truth": 0}, {"key": "35159385", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9235923174695945, "ground_truth": 0}, {"key": "34363669", "model": "llama", "target_model": "llama", "recognition_score": 0.4513264963417892, "ground_truth": 1}, {"key": "34363669", "model": "llama", "target_model": "human", "recognition_score": 0.26284182796360334, "ground_truth": 0}, {"key": "34363669", "model": "llama", "target_model": "claude", "recognition_score": 0.4941408897033868, "ground_truth": 0}, {"key": "34363669", "model": "llama", "target_model": "gpt4", "recognition_score": 0.39981166513058847, "ground_truth": 0}, {"key": "34363669", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3812195466023871, "ground_truth": 0}, {"key": "36119687", "model": "llama", "target_model": "llama", "recognition_score": 0.9588471111671559, "ground_truth": 1}, {"key": "36119687", "model": "llama", "target_model": "human", "recognition_score": 0.9603611649433335, "ground_truth": 0}, {"key": "36119687", "model": "llama", "target_model": "claude", "recognition_score": 0.9615338089954161, "ground_truth": 0}, {"key": "36119687", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9876638993201149, "ground_truth": 0}, {"key": "36119687", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9700134925025463, "ground_truth": 0}, {"key": "35217446", "model": "llama", "target_model": "llama", "recognition_score": 0.881614899365922, "ground_truth": 1}, {"key": "35217446", "model": "llama", "target_model": "human", "recognition_score": 0.9005297868415852, "ground_truth": 0}, {"key": "35217446", "model": "llama", "target_model": "claude", "recognition_score": 0.8568123115774476, "ground_truth": 0}, {"key": "35217446", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9294403994314628, "ground_truth": 0}, {"key": "35217446", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9496693682448624, "ground_truth": 0}, {"key": "39049331", "model": "llama", "target_model": "llama", "recognition_score": 0.8479677543312082, "ground_truth": 1}, {"key": "39049331", "model": "llama", "target_model": "human", "recognition_score": 0.9362850034561181, "ground_truth": 0}, {"key": "39049331", "model": "llama", "target_model": "claude", "recognition_score": 0.78266247500368, "ground_truth": 0}, {"key": "39049331", "model": "llama", "target_model": "gpt4", "recognition_score": 0.884837767874072, "ground_truth": 0}, {"key": "39049331", "model": "llama", "target_model": "gpt35", "recognition_score": 0.931462505734195, "ground_truth": 0}, {"key": "36472242", "model": "llama", "target_model": "llama", "recognition_score": 0.9099070064131008, "ground_truth": 1}, {"key": "36472242", "model": "llama", "target_model": "human", "recognition_score": 0.9190632909494348, "ground_truth": 0}, {"key": "36472242", "model": "llama", "target_model": "claude", "recognition_score": 0.9778834118189987, "ground_truth": 0}, {"key": "36472242", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9339146160483026, "ground_truth": 0}, {"key": "36472242", "model": "llama", "target_model": "gpt35", "recognition_score": 0.932943708895925, "ground_truth": 0}, {"key": "31854721", "model": "llama", "target_model": "llama", "recognition_score": 0.8714748652274065, "ground_truth": 1}, {"key": "31854721", "model": "llama", "target_model": "human", "recognition_score": 0.7520125640566013, "ground_truth": 0}, {"key": "31854721", "model": "llama", "target_model": "claude", "recognition_score": 0.8267117976944968, "ground_truth": 0}, {"key": "31854721", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8940517132778109, "ground_truth": 0}, {"key": "31854721", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8577680981717348, "ground_truth": 0}, {"key": "18725849", "model": "llama", "target_model": "llama", "recognition_score": 0.6187804334312971, "ground_truth": 1}, {"key": "18725849", "model": "llama", "target_model": "human", "recognition_score": 0.5755880064570785, "ground_truth": 0}, {"key": "18725849", "model": "llama", "target_model": "claude", "recognition_score": 0.523420351049277, "ground_truth": 0}, {"key": "18725849", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5888891165670842, "ground_truth": 0}, {"key": "18725849", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7310585596260107, "ground_truth": 0}, {"key": "36883179", "model": "llama", "target_model": "llama", "recognition_score": 0.4111108654748893, "ground_truth": 1}, {"key": "36883179", "model": "llama", "target_model": "human", "recognition_score": 0.5234203539110984, "ground_truth": 0}, {"key": "36883179", "model": "llama", "target_model": "claude", "recognition_score": 0.2991051997433037, "ground_truth": 0}, {"key": "36883179", "model": "llama", "target_model": "gpt4", "recognition_score": 0.359364115443186, "ground_truth": 0}, {"key": "36883179", "model": "llama", "target_model": "gpt35", "recognition_score": 0.45519859288446746, "ground_truth": 0}, {"key": "34266359", "model": "llama", "target_model": "llama", "recognition_score": 0.7592254259494994, "ground_truth": 1}, {"key": "34266359", "model": "llama", "target_model": "human", "recognition_score": 0.8723473774619784, "ground_truth": 0}, {"key": "34266359", "model": "llama", "target_model": "claude", "recognition_score": 0.90260960296147, "ground_truth": 0}, {"key": "34266359", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9039745200070785, "ground_truth": 0}, {"key": "34266359", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9178933731249853, "ground_truth": 0}, {"key": "31920289", "model": "llama", "target_model": "llama", "recognition_score": 0.6001883532761363, "ground_truth": 1}, {"key": "31920289", "model": "llama", "target_model": "human", "recognition_score": 0.6388352872113063, "ground_truth": 0}, {"key": "31920289", "model": "llama", "target_model": "claude", "recognition_score": 0.6926419748467478, "ground_truth": 0}, {"key": "31920289", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5350984414339246, "ground_truth": 0}, {"key": "31920289", "model": "llama", "target_model": "gpt35", "recognition_score": 0.39606817133800204, "ground_truth": 0}, {"key": "36292997", "model": "llama", "target_model": "llama", "recognition_score": 0.7931059511687426, "ground_truth": 1}, {"key": "36292997", "model": "llama", "target_model": "human", "recognition_score": 0.8233284011722272, "ground_truth": 0}, {"key": "36292997", "model": "llama", "target_model": "claude", "recognition_score": 0.8807970642591185, "ground_truth": 0}, {"key": "36292997", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9257686309808092, "ground_truth": 0}, {"key": "36292997", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9066531206109664, "ground_truth": 0}, {"key": "30412533", "model": "llama", "target_model": "llama", "recognition_score": 0.9005297802131476, "ground_truth": 1}, {"key": "30412533", "model": "llama", "target_model": "human", "recognition_score": 0.855851138023168, "ground_truth": 0}, {"key": "30412533", "model": "llama", "target_model": "claude", "recognition_score": 0.8895288571238568, "ground_truth": 0}, {"key": "30412533", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8991213698418379, "ground_truth": 0}, {"key": "30412533", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8856314663534955, "ground_truth": 0}, {"key": "40433191", "model": "llama", "target_model": "llama", "recognition_score": 0.9629528312478451, "ground_truth": 1}, {"key": "40433191", "model": "llama", "target_model": "human", "recognition_score": 0.9629528320629097, "ground_truth": 0}, {"key": "40433191", "model": "llama", "target_model": "claude", "recognition_score": 0.9730364995673975, "ground_truth": 0}, {"key": "40433191", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9637799464852621, "ground_truth": 0}, {"key": "40433191", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9736446468896739, "ground_truth": 0}, {"key": "34565591", "model": "llama", "target_model": "llama", "recognition_score": 0.1338674828087401, "ground_truth": 1}, {"key": "34565591", "model": "llama", "target_model": "human", "recognition_score": 0.5679365917129139, "ground_truth": 0}, {"key": "34565591", "model": "llama", "target_model": "claude", "recognition_score": 0.5755880402730849, "ground_truth": 0}, {"key": "34565591", "model": "llama", "target_model": "gpt4", "recognition_score": 0.36477755561995623, "ground_truth": 0}, {"key": "34565591", "model": "llama", "target_model": "gpt35", "recognition_score": 0.29746994649416575, "ground_truth": 0}, {"key": "36062480", "model": "llama", "target_model": "llama", "recognition_score": 0.9099070064196189, "ground_truth": 1}, {"key": "36062480", "model": "llama", "target_model": "human", "recognition_score": 0.9390248243204907, "ground_truth": 0}, {"key": "36062480", "model": "llama", "target_model": "claude", "recognition_score": 0.9618217198110225, "ground_truth": 0}, {"key": "36062480", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9764905461951217, "ground_truth": 0}, {"key": "36062480", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9394706044086731, "ground_truth": 0}, {"key": "37276883", "model": "llama", "target_model": "llama", "recognition_score": 0.8210441218350273, "ground_truth": 1}, {"key": "37276883", "model": "llama", "target_model": "human", "recognition_score": 0.8832359932565468, "ground_truth": 0}, {"key": "37276883", "model": "llama", "target_model": "claude", "recognition_score": 0.8807970827255165, "ground_truth": 0}, {"key": "37276883", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9358173593914505, "ground_truth": 0}, {"key": "37276883", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9645892684389024, "ground_truth": 0}, {"key": "38509260", "model": "llama", "target_model": "llama", "recognition_score": 0.7416740275573983, "ground_truth": 1}, {"key": "38509260", "model": "llama", "target_model": "human", "recognition_score": 0.8080672032348337, "ground_truth": 0}, {"key": "38509260", "model": "llama", "target_model": "claude", "recognition_score": 0.8104788953146395, "ground_truth": 0}, {"key": "38509260", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9385759594327765, "ground_truth": 0}, {"key": "38509260", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8940517159160224, "ground_truth": 0}, {"key": "37139607", "model": "llama", "target_model": "llama", "recognition_score": 0.851952805423, "ground_truth": 1}, {"key": "37139607", "model": "llama", "target_model": "human", "recognition_score": 0.8606036319856315, "ground_truth": 0}, {"key": "37139607", "model": "llama", "target_model": "claude", "recognition_score": 0.871474861789673, "ground_truth": 0}, {"key": "37139607", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8723473706139698, "ground_truth": 0}, {"key": "37139607", "model": "llama", "target_model": "gpt35", "recognition_score": 0.808067228206549, "ground_truth": 0}, {"key": "37092824", "model": "llama", "target_model": "llama", "recognition_score": 0.9407897484931205, "ground_truth": 1}, {"key": "37092824", "model": "llama", "target_model": "human", "recognition_score": 0.9621075704487462, "ground_truth": 0}, {"key": "37092824", "model": "llama", "target_model": "claude", "recognition_score": 0.967163044813262, "ground_truth": 0}, {"key": "37092824", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9643214495331116, "ground_truth": 0}, {"key": "37092824", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8872045948400333, "ground_truth": 0}, {"key": "32191802", "model": "llama", "target_model": "llama", "recognition_score": 0.966663176519084, "ground_truth": 1}, {"key": "32191802", "model": "llama", "target_model": "human", "recognition_score": 0.9623913643302068, "ground_truth": 0}, {"key": "32191802", "model": "llama", "target_model": "claude", "recognition_score": 0.9791955067869643, "ground_truth": 0}, {"key": "32191802", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9785492701808096, "ground_truth": 0}, {"key": "32191802", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9838471642852911, "ground_truth": 0}, {"key": "39396038", "model": "llama", "target_model": "llama", "recognition_score": 0.9813106910179058, "ground_truth": 1}, {"key": "39396038", "model": "llama", "target_model": "human", "recognition_score": 0.9813106905619841, "ground_truth": 0}, {"key": "39396038", "model": "llama", "target_model": "claude", "recognition_score": 0.960951709149222, "ground_truth": 0}, {"key": "39396038", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9736446481817015, "ground_truth": 0}, {"key": "39396038", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9664104938471605, "ground_truth": 0}, {"key": "39076884", "model": "llama", "target_model": "llama", "recognition_score": 0.8489722046707844, "ground_truth": 1}, {"key": "39076884", "model": "llama", "target_model": "human", "recognition_score": 0.9219218274186138, "ground_truth": 0}, {"key": "39076884", "model": "llama", "target_model": "claude", "recognition_score": 0.8407825992605397, "ground_truth": 0}, {"key": "39076884", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8428631473703498, "ground_truth": 0}, {"key": "39076884", "model": "llama", "target_model": "gpt35", "recognition_score": 0.800691998274498, "ground_truth": 0}, {"key": "27763432", "model": "llama", "target_model": "llama", "recognition_score": 0.5486734857219792, "ground_truth": 1}, {"key": "27763432", "model": "llama", "target_model": "human", "recognition_score": 0.5273165248292673, "ground_truth": 0}, {"key": "27763432", "model": "llama", "target_model": "claude", "recognition_score": 0.3942009395504293, "ground_truth": 0}, {"key": "27763432", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5409238854981206, "ground_truth": 0}, {"key": "27763432", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4035668431119011, "ground_truth": 0}, {"key": "37806929", "model": "llama", "target_model": "llama", "recognition_score": 0.8879840496139275, "ground_truth": 1}, {"key": "37806929", "model": "llama", "target_model": "human", "recognition_score": 0.888758777834806, "ground_truth": 0}, {"key": "37806929", "model": "llama", "target_model": "claude", "recognition_score": 0.827828145243171, "ground_truth": 0}, {"key": "37806929", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8918110454495175, "ground_truth": 0}, {"key": "37806929", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8991213791763459, "ground_truth": 0}, {"key": "32334186", "model": "llama", "target_model": "llama", "recognition_score": 0.8962513741816314, "ground_truth": 1}, {"key": "32334186", "model": "llama", "target_model": "human", "recognition_score": 0.8529354812402709, "ground_truth": 0}, {"key": "32334186", "model": "llama", "target_model": "claude", "recognition_score": 0.8624675362103408, "ground_truth": 0}, {"key": "32334186", "model": "llama", "target_model": "gpt4", "recognition_score": 0.919063288728093, "ground_truth": 0}, {"key": "32334186", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7759445488382107, "ground_truth": 0}, {"key": "36187324", "model": "llama", "target_model": "llama", "recognition_score": 0.9207896733628412, "ground_truth": 1}, {"key": "36187324", "model": "llama", "target_model": "human", "recognition_score": 0.9706877686031603, "ground_truth": 0}, {"key": "36187324", "model": "llama", "target_model": "claude", "recognition_score": 0.9263037357865103, "ground_truth": 0}, {"key": "36187324", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9390248190323194, "ground_truth": 0}, {"key": "36187324", "model": "llama", "target_model": "gpt35", "recognition_score": 0.931462505407559, "ground_truth": 0}, {"key": "35306009", "model": "llama", "target_model": "llama", "recognition_score": 0.9898303412302581, "ground_truth": 1}, {"key": "35306009", "model": "llama", "target_model": "human", "recognition_score": 0.9777138155335751, "ground_truth": 0}, {"key": "35306009", "model": "llama", "target_model": "claude", "recognition_score": 0.9805806517607767, "ground_truth": 0}, {"key": "35306009", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9861513902773066, "ground_truth": 0}, {"key": "35306009", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9856076651694153, "ground_truth": 0}, {"key": "39490050", "model": "llama", "target_model": "llama", "recognition_score": 0.20946968999647905, "ground_truth": 1}, {"key": "39490050", "model": "llama", "target_model": "human", "recognition_score": 0.3157359627435159, "ground_truth": 0}, {"key": "39490050", "model": "llama", "target_model": "claude", "recognition_score": 0.2782568073989907, "ground_truth": 0}, {"key": "39490050", "model": "llama", "target_model": "gpt4", "recognition_score": 0.2689414424032013, "ground_truth": 0}, {"key": "39490050", "model": "llama", "target_model": "gpt35", "recognition_score": 0.3293916949377641, "ground_truth": 0}, {"key": "38072149", "model": "llama", "target_model": "llama", "recognition_score": 0.6424324948158056, "ground_truth": 1}, {"key": "38072149", "model": "llama", "target_model": "human", "recognition_score": 0.8080672118583735, "ground_truth": 0}, {"key": "38072149", "model": "llama", "target_model": "claude", "recognition_score": 0.6352224282192822, "ground_truth": 0}, {"key": "38072149", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8962513675846795, "ground_truth": 0}, {"key": "38072149", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8757869979936338, "ground_truth": 0}, {"key": "35899689", "model": "llama", "target_model": "llama", "recognition_score": 0.8322366585909262, "ground_truth": 1}, {"key": "35899689", "model": "llama", "target_model": "human", "recognition_score": 0.8092759756309149, "ground_truth": 0}, {"key": "35899689", "model": "llama", "target_model": "claude", "recognition_score": 0.8832359814512706, "ground_truth": 0}, {"key": "35899689", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9026095975708076, "ground_truth": 0}, {"key": "35899689", "model": "llama", "target_model": "gpt35", "recognition_score": 0.841825649502859, "ground_truth": 0}, {"key": "27994518", "model": "llama", "target_model": "llama", "recognition_score": 0.8152324892676659, "ground_truth": 1}, {"key": "27994518", "model": "llama", "target_model": "human", "recognition_score": 0.7918210842047553, "ground_truth": 0}, {"key": "27994518", "model": "llama", "target_model": "claude", "recognition_score": 0.8879840540167934, "ground_truth": 0}, {"key": "27994518", "model": "llama", "target_model": "gpt4", "recognition_score": 0.785308571134255, "ground_truth": 0}, {"key": "27994518", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6242935340710725, "ground_truth": 0}, {"key": "10615479", "model": "llama", "target_model": "llama", "recognition_score": 0.21337717310683216, "ground_truth": 1}, {"key": "10615479", "model": "llama", "target_model": "human", "recognition_score": 0.19072401842373496, "ground_truth": 0}, {"key": "10615479", "model": "llama", "target_model": "claude", "recognition_score": 0.24220563113494553, "ground_truth": 0}, {"key": "10615479", "model": "llama", "target_model": "gpt4", "recognition_score": 0.36840569989362815, "ground_truth": 0}, {"key": "10615479", "model": "llama", "target_model": "gpt35", "recognition_score": 0.20689406398151705, "ground_truth": 0}, {"key": "40186667", "model": "llama", "target_model": "llama", "recognition_score": 0.9099070050884444, "ground_truth": 1}, {"key": "40186667", "model": "llama", "target_model": "human", "recognition_score": 0.793105959983944, "ground_truth": 0}, {"key": "40186667", "model": "llama", "target_model": "claude", "recognition_score": 0.9224823447957387, "ground_truth": 0}, {"key": "40186667", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9314625132112359, "ground_truth": 0}, {"key": "40186667", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8469578378995247, "ground_truth": 0}, {"key": "38622886", "model": "llama", "target_model": "llama", "recognition_score": 0.9224823509921949, "ground_truth": 1}, {"key": "38622886", "model": "llama", "target_model": "human", "recognition_score": 0.5544704601600894, "ground_truth": 0}, {"key": "38622886", "model": "llama", "target_model": "claude", "recognition_score": 0.9092645056774064, "ground_truth": 0}, {"key": "38622886", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9278877996193017, "ground_truth": 0}, {"key": "38622886", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8848377602242128, "ground_truth": 0}, {"key": "40686943", "model": "llama", "target_model": "llama", "recognition_score": 0.7446563157464025, "ground_truth": 1}, {"key": "40686943", "model": "llama", "target_model": "human", "recognition_score": 0.815232498197873, "ground_truth": 0}, {"key": "40686943", "model": "llama", "target_model": "claude", "recognition_score": 0.8902942274021604, "ground_truth": 0}, {"key": "40686943", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8365545714418917, "ground_truth": 0}, {"key": "40686943", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9053222943477258, "ground_truth": 0}, {"key": "30604567", "model": "llama", "target_model": "llama", "recognition_score": 0.9824231160807952, "ground_truth": 1}, {"key": "30604567", "model": "llama", "target_model": "human", "recognition_score": 0.9835969692370957, "ground_truth": 0}, {"key": "30604567", "model": "llama", "target_model": "claude", "recognition_score": 0.9690910395004987, "ground_truth": 0}, {"key": "30604567", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9768465901598771, "ground_truth": 0}, {"key": "30604567", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9773708006320218, "ground_truth": 0}, {"key": "35440903", "model": "llama", "target_model": "llama", "recognition_score": 0.8344068947320945, "ground_truth": 1}, {"key": "35440903", "model": "llama", "target_model": "human", "recognition_score": 0.8092759824013381, "ground_truth": 0}, {"key": "35440903", "model": "llama", "target_model": "claude", "recognition_score": 0.8947894629011311, "ground_truth": 0}, {"key": "35440903", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7905303281918424, "ground_truth": 0}, {"key": "35440903", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8311430611772932, "ground_truth": 0}, {"key": "37219533", "model": "llama", "target_model": "llama", "recognition_score": 0.5078118690082142, "ground_truth": 1}, {"key": "37219533", "model": "llama", "target_model": "human", "recognition_score": 0.6076631878527902, "ground_truth": 0}, {"key": "37219533", "model": "llama", "target_model": "claude", "recognition_score": 0.5525397208811569, "ground_truth": 0}, {"key": "37219533", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5525397107517402, "ground_truth": 0}, {"key": "37219533", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6926419851521414, "ground_truth": 0}, {"key": "40178965", "model": "llama", "target_model": "llama", "recognition_score": 0.9600626845059193, "ground_truth": 1}, {"key": "40178965", "model": "llama", "target_model": "human", "recognition_score": 0.9640516750879535, "ground_truth": 0}, {"key": "40178965", "model": "llama", "target_model": "claude", "recognition_score": 0.9092645127017738, "ground_truth": 0}, {"key": "40178965", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9412234496615794, "ground_truth": 0}, {"key": "40178965", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9539660994969672, "ground_truth": 0}, {"key": "13750468", "model": "llama", "target_model": "llama", "recognition_score": 0.6279512212778394, "ground_truth": 1}, {"key": "13750468", "model": "llama", "target_model": "human", "recognition_score": 0.7879311800982782, "ground_truth": 0}, {"key": "13750468", "model": "llama", "target_model": "claude", "recognition_score": 0.835483560248679, "ground_truth": 0}, {"key": "13750468", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7295197970987037, "ground_truth": 0}, {"key": "13750468", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7534666419850022, "ground_truth": 0}, {"key": "17754949", "model": "llama", "target_model": "llama", "recognition_score": 0.7505527623183045, "ground_truth": 1}, {"key": "17754949", "model": "llama", "target_model": "human", "recognition_score": 0.4205995991109218, "ground_truth": 0}, {"key": "17754949", "model": "llama", "target_model": "claude", "recognition_score": 0.8386797657232388, "ground_truth": 0}, {"key": "17754949", "model": "llama", "target_model": "gpt4", "recognition_score": 0.787931222710584, "ground_truth": 0}, {"key": "17754949", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8991213852393625, "ground_truth": 0}, {"key": "36675623", "model": "llama", "target_model": "llama", "recognition_score": 0.977370801235632, "ground_truth": 1}, {"key": "36675623", "model": "llama", "target_model": "human", "recognition_score": 0.984093607470184, "ground_truth": 0}, {"key": "36675623", "model": "llama", "target_model": "claude", "recognition_score": 0.9653811605687408, "ground_truth": 0}, {"key": "36675623", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9429285955387887, "ground_truth": 0}, {"key": "36675623", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9734434285280819, "ground_truth": 0}, {"key": "40035440", "model": "llama", "target_model": "llama", "recognition_score": 0.9930423919930828, "ground_truth": 1}, {"key": "40035440", "model": "llama", "target_model": "human", "recognition_score": 0.9884026382689763, "ground_truth": 0}, {"key": "40035440", "model": "llama", "target_model": "claude", "recognition_score": 0.9511422214865781, "ground_truth": 0}, {"key": "40035440", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9773707995738495, "ground_truth": 0}, {"key": "40035440", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9895109079809827, "ground_truth": 0}, {"key": "37685909", "model": "llama", "target_model": "llama", "recognition_score": 0.5888891174932211, "ground_truth": 1}, {"key": "37685909", "model": "llama", "target_model": "human", "recognition_score": 0.4882834061314722, "ground_truth": 0}, {"key": "37685909", "model": "llama", "target_model": "claude", "recognition_score": 0.6424324736391813, "ground_truth": 0}, {"key": "37685909", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5350984290974717, "ground_truth": 0}, {"key": "37685909", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5156199098698148, "ground_truth": 0}, {"key": "36938787", "model": "llama", "target_model": "llama", "recognition_score": 0.7057850254097384, "ground_truth": 1}, {"key": "36938787", "model": "llama", "target_model": "human", "recognition_score": 0.6723317106049095, "ground_truth": 0}, {"key": "36938787", "model": "llama", "target_model": "claude", "recognition_score": 0.7356416283154964, "ground_truth": 0}, {"key": "36938787", "model": "llama", "target_model": "gpt4", "recognition_score": 0.694302663291878, "ground_truth": 0}, {"key": "36938787", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7969253634583814, "ground_truth": 0}, {"key": "39398068", "model": "llama", "target_model": "llama", "recognition_score": 0.5717665924154699, "ground_truth": 1}, {"key": "39398068", "model": "llama", "target_model": "human", "recognition_score": 0.4804786448160244, "ground_truth": 0}, {"key": "39398068", "model": "llama", "target_model": "claude", "recognition_score": 0.7943849696735475, "ground_truth": 0}, {"key": "39398068", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7138307306246381, "ground_truth": 0}, {"key": "39398068", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7606506449065245, "ground_truth": 0}, {"key": "39926408", "model": "llama", "target_model": "llama", "recognition_score": 0.7490872191895371, "ground_truth": 1}, {"key": "39926408", "model": "llama", "target_model": "human", "recognition_score": 0.908617892469195, "ground_truth": 0}, {"key": "39926408", "model": "llama", "target_model": "claude", "recognition_score": 0.6959583186612208, "ground_truth": 0}, {"key": "39926408", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8418256424378764, "ground_truth": 0}, {"key": "39926408", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7879311956951306, "ground_truth": 0}, {"key": "40465336", "model": "llama", "target_model": "llama", "recognition_score": 0.8705972646500015, "ground_truth": 1}, {"key": "40465336", "model": "llama", "target_model": "human", "recognition_score": 0.8044059159324415, "ground_truth": 0}, {"key": "40465336", "model": "llama", "target_model": "claude", "recognition_score": 0.8848377766615912, "ground_truth": 0}, {"key": "40465336", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8459424372173058, "ground_truth": 0}, {"key": "40465336", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8976953003832341, "ground_truth": 0}, {"key": "34173549", "model": "llama", "target_model": "llama", "recognition_score": 0.7341194951915996, "ground_truth": 1}, {"key": "34173549", "model": "llama", "target_model": "human", "recognition_score": 0.9284087954372237, "ground_truth": 0}, {"key": "34173549", "model": "llama", "target_model": "claude", "recognition_score": 0.7799929138114992, "ground_truth": 0}, {"key": "34173549", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8984105570508532, "ground_truth": 0}, {"key": "34173549", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8962513718792297, "ground_truth": 0}, {"key": "33541535", "model": "llama", "target_model": "llama", "recognition_score": 0.9572778023593306, "ground_truth": 1}, {"key": "33541535", "model": "llama", "target_model": "human", "recognition_score": 0.8469578345475257, "ground_truth": 0}, {"key": "33541535", "model": "llama", "target_model": "claude", "recognition_score": 0.8962513762202067, "ground_truth": 0}, {"key": "33541535", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8918110428880481, "ground_truth": 0}, {"key": "33541535", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9437636580474149, "ground_truth": 0}, {"key": "35685195", "model": "llama", "target_model": "llama", "recognition_score": 0.9224823481190138, "ground_truth": 1}, {"key": "35685195", "model": "llama", "target_model": "human", "recognition_score": 0.7248702625792365, "ground_truth": 0}, {"key": "35685195", "model": "llama", "target_model": "claude", "recognition_score": 0.8925625157475374, "ground_truth": 0}, {"key": "35685195", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8652240892335591, "ground_truth": 0}, {"key": "35685195", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8397339633497862, "ground_truth": 0}, {"key": "28440730", "model": "llama", "target_model": "llama", "recognition_score": 0.22405545252452252, "ground_truth": 1}, {"key": "28440730", "model": "llama", "target_model": "human", "recognition_score": 0.4629585919296942, "ground_truth": 0}, {"key": "28440730", "model": "llama", "target_model": "claude", "recognition_score": 0.5292634060917097, "ground_truth": 0}, {"key": "28440730", "model": "llama", "target_model": "gpt4", "recognition_score": 0.343341731629333, "ground_truth": 0}, {"key": "28440730", "model": "llama", "target_model": "gpt35", "recognition_score": 0.2689414164157599, "ground_truth": 0}, {"key": "38338714", "model": "llama", "target_model": "llama", "recognition_score": 0.9579122712966389, "ground_truth": 1}, {"key": "38338714", "model": "llama", "target_model": "human", "recognition_score": 0.9319595772720152, "ground_truth": 0}, {"key": "38338714", "model": "llama", "target_model": "claude", "recognition_score": 0.9615338074817301, "ground_truth": 0}, {"key": "38338714", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9394706105031143, "ground_truth": 0}, {"key": "38338714", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9367494744811793, "ground_truth": 0}, {"key": "32191881", "model": "llama", "target_model": "llama", "recognition_score": 0.49218813601279165, "ground_truth": 1}, {"key": "32191881", "model": "llama", "target_model": "human", "recognition_score": 0.24944723822479017, "ground_truth": 0}, {"key": "32191881", "model": "llama", "target_model": "claude", "recognition_score": 0.3867634495109305, "ground_truth": 0}, {"key": "32191881", "model": "llama", "target_model": "gpt4", "recognition_score": 0.33458943837715044, "ground_truth": 0}, {"key": "32191881", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5058590794670175, "ground_truth": 0}, {"key": "37707251", "model": "llama", "target_model": "llama", "recognition_score": 0.6460136859939807, "ground_truth": 1}, {"key": "37707251", "model": "llama", "target_model": "human", "recognition_score": 0.8740772368449922, "ground_truth": 0}, {"key": "37707251", "model": "llama", "target_model": "claude", "recognition_score": 0.8128673094770431, "ground_truth": 0}, {"key": "37707251", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8757869979557288, "ground_truth": 0}, {"key": "37707251", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7994423128926929, "ground_truth": 0}, {"key": "40172567", "model": "llama", "target_model": "llama", "recognition_score": 0.5832033600580511, "ground_truth": 1}, {"key": "40172567", "model": "llama", "target_model": "human", "recognition_score": 0.6584174869428375, "ground_truth": 0}, {"key": "40172567", "model": "llama", "target_model": "claude", "recognition_score": 0.3979383990303769, "ground_truth": 0}, {"key": "40172567", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7549149785115981, "ground_truth": 0}, {"key": "40172567", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6723316683325431, "ground_truth": 0}, {"key": "33113255", "model": "llama", "target_model": "llama", "recognition_score": 0.9219218323059304, "ground_truth": 1}, {"key": "33113255", "model": "llama", "target_model": "human", "recognition_score": 0.9252299624468818, "ground_truth": 0}, {"key": "33113255", "model": "llama", "target_model": "claude", "recognition_score": 0.9329437185139706, "ground_truth": 0}, {"key": "33113255", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9039745062509084, "ground_truth": 0}, {"key": "33113255", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9485372381667561, "ground_truth": 0}, {"key": "33022143", "model": "llama", "target_model": "llama", "recognition_score": 0.6057990680180895, "ground_truth": 1}, {"key": "33022143", "model": "llama", "target_model": "human", "recognition_score": 0.5717665731590517, "ground_truth": 0}, {"key": "33022143", "model": "llama", "target_model": "claude", "recognition_score": 0.48633152565640186, "ground_truth": 0}, {"key": "33022143", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6808786132449354, "ground_truth": 0}, {"key": "33022143", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5794003921288564, "ground_truth": 0}, {"key": "32084473", "model": "llama", "target_model": "llama", "recognition_score": 0.9343951593625391, "ground_truth": 1}, {"key": "32084473", "model": "llama", "target_model": "human", "recognition_score": 0.9603611596493059, "ground_truth": 0}, {"key": "32084473", "model": "llama", "target_model": "claude", "recognition_score": 0.9849273715243648, "ground_truth": 0}, {"key": "32084473", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9525741267719486, "ground_truth": 0}, {"key": "32084473", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9688561703084366, "ground_truth": 0}, {"key": "40564245", "model": "llama", "target_model": "llama", "recognition_score": 0.4263215999078941, "ground_truth": 1}, {"key": "40564245", "model": "llama", "target_model": "human", "recognition_score": 0.9343951641924564, "ground_truth": 0}, {"key": "40564245", "model": "llama", "target_model": "claude", "recognition_score": 0.7520125817073771, "ground_truth": 0}, {"key": "40564245", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6584174548468369, "ground_truth": 0}, {"key": "40564245", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8244619393611623, "ground_truth": 0}, {"key": "31717213", "model": "llama", "target_model": "llama", "recognition_score": 0.910545394541871, "ground_truth": 1}, {"key": "31717213", "model": "llama", "target_model": "human", "recognition_score": 0.7074047084541117, "ground_truth": 0}, {"key": "31717213", "model": "llama", "target_model": "claude", "recognition_score": 0.8757869813202782, "ground_truth": 0}, {"key": "31717213", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7279754491802898, "ground_truth": 0}, {"key": "31717213", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8509647050462616, "ground_truth": 0}, {"key": "34861894", "model": "llama", "target_model": "llama", "recognition_score": 0.8031737997106735, "ground_truth": 1}, {"key": "34861894", "model": "llama", "target_model": "human", "recognition_score": 0.6959583108135324, "ground_truth": 0}, {"key": "34861894", "model": "llama", "target_model": "claude", "recognition_score": 0.7057850449507507, "ground_truth": 0}, {"key": "34861894", "model": "llama", "target_model": "gpt4", "recognition_score": 0.865224065200389, "ground_truth": 0}, {"key": "34861894", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7106283215461665, "ground_truth": 0}, {"key": "40838760", "model": "llama", "target_model": "llama", "recognition_score": 0.959459261657584, "ground_truth": 1}, {"key": "40838760", "model": "llama", "target_model": "human", "recognition_score": 0.9782188279946518, "ground_truth": 0}, {"key": "40838760", "model": "llama", "target_model": "claude", "recognition_score": 0.9124361550511702, "ground_truth": 0}, {"key": "40838760", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8116760084376508, "ground_truth": 0}, {"key": "40838760", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9142907204837287, "ground_truth": 0}, {"key": "40044849", "model": "llama", "target_model": "llama", "recognition_score": 0.962952830416441, "ground_truth": 1}, {"key": "40044849", "model": "llama", "target_model": "human", "recognition_score": 0.8902942235503003, "ground_truth": 0}, {"key": "40044849", "model": "llama", "target_model": "claude", "recognition_score": 0.856812308777757, "ground_truth": 0}, {"key": "40044849", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9381240105248488, "ground_truth": 0}, {"key": "40044849", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9207896715242533, "ground_truth": 0}, {"key": "30296116", "model": "llama", "target_model": "llama", "recognition_score": 0.5214711453486054, "ground_truth": 1}, {"key": "30296116", "model": "llama", "target_model": "human", "recognition_score": 0.6001883675456055, "ground_truth": 0}, {"key": "30296116", "model": "llama", "target_model": "claude", "recognition_score": 0.7248703038112866, "ground_truth": 0}, {"key": "30296116", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6388352756694229, "ground_truth": 0}, {"key": "30296116", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4941408864965346, "ground_truth": 0}, {"key": "34931360", "model": "llama", "target_model": "llama", "recognition_score": 0.9118099485753559, "ground_truth": 1}, {"key": "34931360", "model": "llama", "target_model": "human", "recognition_score": 0.7122322030206738, "ground_truth": 0}, {"key": "34931360", "model": "llama", "target_model": "claude", "recognition_score": 0.5448014030205701, "ground_truth": 0}, {"key": "34931360", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7341195393835207, "ground_truth": 0}, {"key": "34931360", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7431680236458649, "ground_truth": 0}, {"key": "18862422", "model": "llama", "target_model": "llama", "recognition_score": 0.616935849691936, "ground_truth": 1}, {"key": "18862422", "model": "llama", "target_model": "human", "recognition_score": 0.8244619276004941, "ground_truth": 0}, {"key": "18862422", "model": "llama", "target_model": "claude", "recognition_score": 0.6706083144142188, "ground_truth": 0}, {"key": "18862422", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8568122960230985, "ground_truth": 0}, {"key": "18862422", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7662936557806724, "ground_truth": 0}, {"key": "36361140", "model": "llama", "target_model": "llama", "recognition_score": 0.985718066440707, "ground_truth": 1}, {"key": "36361140", "model": "llama", "target_model": "human", "recognition_score": 0.9807288629453845, "ground_truth": 0}, {"key": "36361140", "model": "llama", "target_model": "claude", "recognition_score": 0.9783846671320598, "ground_truth": 0}, {"key": "36361140", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9811668698130764, "ground_truth": 0}, {"key": "36361140", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9695556505480758, "ground_truth": 0}, {"key": "39703329", "model": "llama", "target_model": "llama", "recognition_score": 0.20434189641175396, "ground_truth": 1}, {"key": "39703329", "model": "llama", "target_model": "human", "recognition_score": 0.5234203355282797, "ground_truth": 0}, {"key": "39703329", "model": "llama", "target_model": "claude", "recognition_score": 0.370225378962516, "ground_truth": 0}, {"key": "39703329", "model": "llama", "target_model": "gpt4", "recognition_score": 0.46879060164952213, "ground_truth": 0}, {"key": "39703329", "model": "llama", "target_model": "gpt35", "recognition_score": 0.4378234820055866, "ground_truth": 0}, {"key": "34033324", "model": "llama", "target_model": "llama", "recognition_score": 0.9825575154661957, "ground_truth": 1}, {"key": "34033324", "model": "llama", "target_model": "human", "recognition_score": 0.9810219657662792, "ground_truth": 0}, {"key": "34033324", "model": "llama", "target_model": "claude", "recognition_score": 0.9339146152140639, "ground_truth": 0}, {"key": "34033324", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9872772910104125, "ground_truth": 0}, {"key": "34033324", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9706877696343907, "ground_truth": 0}, {"key": "35658862", "model": "llama", "target_model": "llama", "recognition_score": 0.8397339694742717, "ground_truth": 1}, {"key": "35658862", "model": "llama", "target_model": "human", "recognition_score": 0.9566342019983496, "ground_truth": 0}, {"key": "35658862", "model": "llama", "target_model": "claude", "recognition_score": 0.922482334986921, "ground_truth": 0}, {"key": "35658862", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8577681065665457, "ground_truth": 0}, {"key": "35658862", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7662936637403923, "ground_truth": 0}, {"key": "36092657", "model": "llama", "target_model": "llama", "recognition_score": 0.9099070147799211, "ground_truth": 1}, {"key": "36092657", "model": "llama", "target_model": "human", "recognition_score": 0.8872045865992692, "ground_truth": 0}, {"key": "36092657", "model": "llama", "target_model": "claude", "recognition_score": 0.9196425326329484, "ground_truth": 0}, {"key": "36092657", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8386797550981034, "ground_truth": 0}, {"key": "36092657", "model": "llama", "target_model": "gpt35", "recognition_score": 0.936749474838422, "ground_truth": 0}, {"key": "26333438", "model": "llama", "target_model": "llama", "recognition_score": 0.8529354850611606, "ground_truth": 1}, {"key": "26333438", "model": "llama", "target_model": "human", "recognition_score": 0.7956581083569115, "ground_truth": 0}, {"key": "26333438", "model": "llama", "target_model": "claude", "recognition_score": 0.8056322166522923, "ground_truth": 0}, {"key": "26333438", "model": "llama", "target_model": "gpt4", "recognition_score": 0.74613900006728, "ground_truth": 0}, {"key": "26333438", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7431680106192161, "ground_truth": 0}, {"key": "34184963", "model": "llama", "target_model": "llama", "recognition_score": 0.6206216103045609, "ground_truth": 1}, {"key": "34184963", "model": "llama", "target_model": "human", "recognition_score": 0.7170118715455952, "ground_truth": 0}, {"key": "34184963", "model": "llama", "target_model": "claude", "recognition_score": 0.426321598834159, "ground_truth": 0}, {"key": "34184963", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6495786338453552, "ground_truth": 0}, {"key": "34184963", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5544704620551199, "ground_truth": 0}, {"key": "35069975", "model": "llama", "target_model": "llama", "recognition_score": 0.5350984539150911, "ground_truth": 1}, {"key": "35069975", "model": "llama", "target_model": "human", "recognition_score": 0.7648916263108747, "ground_truth": 0}, {"key": "35069975", "model": "llama", "target_model": "claude", "recognition_score": 0.7662936461100337, "ground_truth": 0}, {"key": "35069975", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7185944061177596, "ground_truth": 0}, {"key": "35069975", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5813030975989408, "ground_truth": 0}, {"key": "36443950", "model": "llama", "target_model": "llama", "recognition_score": 0.6513548505519012, "ground_truth": 1}, {"key": "36443950", "model": "llama", "target_model": "human", "recognition_score": 0.6442251137079722, "ground_truth": 0}, {"key": "36443950", "model": "llama", "target_model": "claude", "recognition_score": 0.6757646203548335, "ground_truth": 0}, {"key": "36443950", "model": "llama", "target_model": "gpt4", "recognition_score": 0.65312692644936, "ground_truth": 0}, {"key": "36443950", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5717666054757417, "ground_truth": 0}, {"key": "29460858", "model": "llama", "target_model": "llama", "recognition_score": 0.629774618666727, "ground_truth": 1}, {"key": "29460858", "model": "llama", "target_model": "human", "recognition_score": 0.37937838538251767, "ground_truth": 0}, {"key": "29460858", "model": "llama", "target_model": "claude", "recognition_score": 0.6808786186233934, "ground_truth": 0}, {"key": "29460858", "model": "llama", "target_model": "gpt4", "recognition_score": 0.33458945675063795, "ground_truth": 0}, {"key": "29460858", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6723316989949463, "ground_truth": 0}, {"key": "36155704", "model": "llama", "target_model": "llama", "recognition_score": 0.3757064432133711, "ground_truth": 1}, {"key": "36155704", "model": "llama", "target_model": "human", "recognition_score": 0.575588035188089, "ground_truth": 0}, {"key": "36155704", "model": "llama", "target_model": "claude", "recognition_score": 0.5136684723155612, "ground_truth": 0}, {"key": "36155704", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5964331370592362, "ground_truth": 0}, {"key": "36155704", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "37185211", "model": "llama", "target_model": "llama", "recognition_score": 0.9334308073581987, "ground_truth": 1}, {"key": "37185211", "model": "llama", "target_model": "human", "recognition_score": 0.9202179945732417, "ground_truth": 0}, {"key": "37185211", "model": "llama", "target_model": "claude", "recognition_score": 0.9278877920630202, "ground_truth": 0}, {"key": "37185211", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9353465082954119, "ground_truth": 0}, {"key": "37185211", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9136765209660096, "ground_truth": 0}, {"key": "36454885", "model": "llama", "target_model": "llama", "recognition_score": 0.8322366508843972, "ground_truth": 1}, {"key": "36454885", "model": "llama", "target_model": "human", "recognition_score": 0.7892337051426407, "ground_truth": 0}, {"key": "36454885", "model": "llama", "target_model": "claude", "recognition_score": 0.7813306248684346, "ground_truth": 0}, {"key": "36454885", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9012274196863627, "ground_truth": 0}, {"key": "36454885", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8539127572226581, "ground_truth": 0}, {"key": "33148906", "model": "llama", "target_model": "llama", "recognition_score": 0.35220177442149064, "ground_truth": 1}, {"key": "33148906", "model": "llama", "target_model": "human", "recognition_score": 0.26894144045432, "ground_truth": 0}, {"key": "33148906", "model": "llama", "target_model": "claude", "recognition_score": 0.47463114423734265, "ground_truth": 0}, {"key": "33148906", "model": "llama", "target_model": "gpt4", "recognition_score": 0.44939265202944384, "ground_truth": 0}, {"key": "33148906", "model": "llama", "target_model": "gpt35", "recognition_score": 0.33285233080826704, "ground_truth": 0}, {"key": "18086604", "model": "llama", "target_model": "llama", "recognition_score": 0.37022538636859614, "ground_truth": 1}, {"key": "18086604", "model": "llama", "target_model": "human", "recognition_score": 0.6876299806666437, "ground_truth": 0}, {"key": "18086604", "model": "llama", "target_model": "claude", "recognition_score": 0.41111085719796714, "ground_truth": 0}, {"key": "18086604", "model": "llama", "target_model": "gpt4", "recognition_score": 0.21076629389593746, "ground_truth": 0}, {"key": "18086604", "model": "llama", "target_model": "gpt35", "recognition_score": 0.49218813687826024, "ground_truth": 0}, {"key": "33693397", "model": "llama", "target_model": "llama", "recognition_score": 0.7943849587611348, "ground_truth": 1}, {"key": "33693397", "model": "llama", "target_model": "human", "recognition_score": 0.7371581595199649, "ground_truth": 0}, {"key": "33693397", "model": "llama", "target_model": "claude", "recognition_score": 0.7918210527417507, "ground_truth": 0}, {"key": "33693397", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7248702913586476, "ground_truth": 0}, {"key": "33693397", "model": "llama", "target_model": "gpt35", "recognition_score": 0.702530051251516, "ground_truth": 0}, {"key": "39501530", "model": "llama", "target_model": "llama", "recognition_score": 0.3923368113059107, "ground_truth": 1}, {"key": "39501530", "model": "llama", "target_model": "human", "recognition_score": 0.3849121380703095, "ground_truth": 0}, {"key": "39501530", "model": "llama", "target_model": "claude", "recognition_score": 0.30404166925529635, "ground_truth": 0}, {"key": "39501530", "model": "llama", "target_model": "gpt4", "recognition_score": 0.30404166669592314, "ground_truth": 0}, {"key": "39501530", "model": "llama", "target_model": "gpt35", "recognition_score": 0.22000710033399212, "ground_truth": 0}, {"key": "30948874", "model": "llama", "target_model": "llama", "recognition_score": 0.9173026569617584, "ground_truth": 1}, {"key": "30948874", "model": "llama", "target_model": "human", "recognition_score": 0.907967144712895, "ground_truth": 0}, {"key": "30948874", "model": "llama", "target_model": "claude", "recognition_score": 0.9579122687505698, "ground_truth": 0}, {"key": "30948874", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9130583389483241, "ground_truth": 0}, {"key": "30948874", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8895288499168811, "ground_truth": 0}, {"key": "39410675", "model": "llama", "target_model": "llama", "recognition_score": 0.8766343777446595, "ground_truth": 1}, {"key": "39410675", "model": "llama", "target_model": "human", "recognition_score": 0.896251371474433, "ground_truth": 0}, {"key": "39410675", "model": "llama", "target_model": "claude", "recognition_score": 0.925229954298839, "ground_truth": 0}, {"key": "39410675", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9149009503298524, "ground_truth": 0}, {"key": "39410675", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9167080771882483, "ground_truth": 0}, {"key": "32903337", "model": "llama", "target_model": "llama", "recognition_score": 0.5717666077473812, "ground_truth": 1}, {"key": "32903337", "model": "llama", "target_model": "human", "recognition_score": 0.5331544105913559, "ground_truth": 0}, {"key": "32903337", "model": "llama", "target_model": "claude", "recognition_score": 0.667147696234115, "ground_truth": 0}, {"key": "32903337", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8311430497353273, "ground_truth": 0}, {"key": "32903337", "model": "llama", "target_model": "gpt35", "recognition_score": 0.5331543923018037, "ground_truth": 0}, {"key": "27685132", "model": "llama", "target_model": "llama", "recognition_score": 0.8749346120313862, "ground_truth": 1}, {"key": "27685132", "model": "llama", "target_model": "human", "recognition_score": 0.7505527560447268, "ground_truth": 0}, {"key": "27685132", "model": "llama", "target_model": "claude", "recognition_score": 0.7490872153708932, "ground_truth": 0}, {"key": "27685132", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8529354722411525, "ground_truth": 0}, {"key": "27685132", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6791786768023091, "ground_truth": 0}, {"key": "22791471", "model": "llama", "target_model": "llama", "recognition_score": 0.7994423049294901, "ground_truth": 1}, {"key": "22791471", "model": "llama", "target_model": "human", "recognition_score": 0.8418256503904111, "ground_truth": 0}, {"key": "22791471", "model": "llama", "target_model": "claude", "recognition_score": 0.8902942295841423, "ground_truth": 0}, {"key": "22791471", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8807970861579817, "ground_truth": 0}, {"key": "22791471", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8365545467077294, "ground_truth": 0}, {"key": "32292348", "model": "llama", "target_model": "llama", "recognition_score": 0.8365545615244392, "ground_truth": 1}, {"key": "32292348", "model": "llama", "target_model": "human", "recognition_score": 0.8289388156192714, "ground_truth": 0}, {"key": "32292348", "model": "llama", "target_model": "claude", "recognition_score": 0.7676898730341268, "ground_truth": 0}, {"key": "32292348", "model": "llama", "target_model": "gpt4", "recognition_score": 0.815232491623764, "ground_truth": 0}, {"key": "32292348", "model": "llama", "target_model": "gpt35", "recognition_score": 0.809275982013155, "ground_truth": 0}, {"key": "20482930", "model": "llama", "target_model": "llama", "recognition_score": 0.8376199518408942, "ground_truth": 1}, {"key": "20482930", "model": "llama", "target_model": "human", "recognition_score": 0.7634837771904386, "ground_truth": 0}, {"key": "20482930", "model": "llama", "target_model": "claude", "recognition_score": 0.7839884469666618, "ground_truth": 0}, {"key": "20482930", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8255897121934986, "ground_truth": 0}, {"key": "20482930", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8479677603329467, "ground_truth": 0}, {"key": "11635754", "model": "llama", "target_model": "llama", "recognition_score": 0.892562523191851, "ground_truth": 1}, {"key": "11635754", "model": "llama", "target_model": "human", "recognition_score": 0.72017148860717, "ground_truth": 0}, {"key": "11635754", "model": "llama", "target_model": "claude", "recognition_score": 0.8386797573568172, "ground_truth": 0}, {"key": "11635754", "model": "llama", "target_model": "gpt4", "recognition_score": 0.857768102405152, "ground_truth": 0}, {"key": "11635754", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9319595729113158, "ground_truth": 0}, {"key": "40029096", "model": "llama", "target_model": "llama", "recognition_score": 0.8615382125672081, "ground_truth": 1}, {"key": "40029096", "model": "llama", "target_model": "human", "recognition_score": 0.8489721933390575, "ground_truth": 0}, {"key": "40029096", "model": "llama", "target_model": "claude", "recognition_score": 0.743168015851565, "ground_truth": 0}, {"key": "40029096", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7956581245142991, "ground_truth": 0}, {"key": "40029096", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7732163764861064, "ground_truth": 0}, {"key": "40414719", "model": "llama", "target_model": "llama", "recognition_score": 0.9600626864765939, "ground_truth": 1}, {"key": "40414719", "model": "llama", "target_model": "human", "recognition_score": 0.9770226303217222, "ground_truth": 0}, {"key": "40414719", "model": "llama", "target_model": "claude", "recognition_score": 0.9399133499880429, "ground_truth": 0}, {"key": "40414719", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9742394428815718, "ground_truth": 0}, {"key": "40414719", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9669140211164116, "ground_truth": 0}, {"key": "39537616", "model": "llama", "target_model": "llama", "recognition_score": 0.9319595769980458, "ground_truth": 1}, {"key": "39537616", "model": "llama", "target_model": "human", "recognition_score": 0.9005297868747533, "ground_truth": 0}, {"key": "39537616", "model": "llama", "target_model": "claude", "recognition_score": 0.9032942037027787, "ground_truth": 0}, {"key": "39537616", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7690802341449956, "ground_truth": 0}, {"key": "39537616", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8799743780535757, "ground_truth": 0}, {"key": "33245830", "model": "llama", "target_model": "llama", "recognition_score": 0.28457600761299584, "ground_truth": 1}, {"key": "33245830", "model": "llama", "target_model": "human", "recognition_score": 0.3942009684788906, "ground_truth": 0}, {"key": "33245830", "model": "llama", "target_model": "claude", "recognition_score": 0.2043418837961603, "ground_truth": 0}, {"key": "33245830", "model": "llama", "target_model": "gpt4", "recognition_score": 0.235108405122138, "ground_truth": 0}, {"key": "33245830", "model": "llama", "target_model": "gpt35", "recognition_score": 0.33633106287415965, "ground_truth": 0}, {"key": "39243601", "model": "llama", "target_model": "llama", "recognition_score": 0.5945512752643739, "ground_truth": 1}, {"key": "39243601", "model": "llama", "target_model": "human", "recognition_score": 0.4167966253271578, "ground_truth": 0}, {"key": "39243601", "model": "llama", "target_model": "claude", "recognition_score": 0.6636689442240383, "ground_truth": 0}, {"key": "39243601", "model": "llama", "target_model": "gpt4", "recognition_score": 0.5774953502649867, "ground_truth": 0}, {"key": "39243601", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7122321895139184, "ground_truth": 0}, {"key": "35815905", "model": "llama", "target_model": "llama", "recognition_score": 0.6654105500512966, "ground_truth": 1}, {"key": "35815905", "model": "llama", "target_model": "human", "recognition_score": 0.646013706317084, "ground_truth": 0}, {"key": "35815905", "model": "llama", "target_model": "claude", "recognition_score": 0.7217432166712301, "ground_truth": 0}, {"key": "35815905", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8397339692348371, "ground_truth": 0}, {"key": "35815905", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6959583112755904, "ground_truth": 0}, {"key": "35260212", "model": "llama", "target_model": "llama", "recognition_score": 0.8705972806456356, "ground_truth": 1}, {"key": "35260212", "model": "llama", "target_model": "human", "recognition_score": 0.7813306332098828, "ground_truth": 0}, {"key": "35260212", "model": "llama", "target_model": "claude", "recognition_score": 0.7577943650603001, "ground_truth": 0}, {"key": "35260212", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9130583473296172, "ground_truth": 0}, {"key": "35260212", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9167080897329698, "ground_truth": 0}, {"key": "39193924", "model": "llama", "target_model": "llama", "recognition_score": 0.39047584878831565, "ground_truth": 1}, {"key": "39193924", "model": "llama", "target_model": "human", "recognition_score": 0.8175744755572424, "ground_truth": 0}, {"key": "39193924", "model": "llama", "target_model": "claude", "recognition_score": 0.6388352783909083, "ground_truth": 0}, {"key": "39193924", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6352224553842643, "ground_truth": 0}, {"key": "39193924", "model": "llama", "target_model": "gpt35", "recognition_score": 0.811676020251986, "ground_truth": 0}, {"key": "40658569", "model": "llama", "target_model": "llama", "recognition_score": 0.6001883520933617, "ground_truth": 1}, {"key": "40658569", "model": "llama", "target_model": "human", "recognition_score": 0.44167303537826547, "ground_truth": 0}, {"key": "40658569", "model": "llama", "target_model": "claude", "recognition_score": 0.7634837608004374, "ground_truth": 0}, {"key": "40658569", "model": "llama", "target_model": "gpt4", "recognition_score": 0.6688802718164496, "ground_truth": 0}, {"key": "40658569", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6842640123116267, "ground_truth": 0}, {"key": "33497596", "model": "llama", "target_model": "llama", "recognition_score": 0.9026096020355415, "ground_truth": 1}, {"key": "33497596", "model": "llama", "target_model": "human", "recognition_score": 0.8289388162026272, "ground_truth": 0}, {"key": "33497596", "model": "llama", "target_model": "claude", "recognition_score": 0.9105454008965941, "ground_truth": 0}, {"key": "33497596", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8459424385896164, "ground_truth": 0}, {"key": "33497596", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8558511432705108, "ground_truth": 0}, {"key": "40339241", "model": "llama", "target_model": "llama", "recognition_score": 0.8714748589677714, "ground_truth": 1}, {"key": "40339241", "model": "llama", "target_model": "human", "recognition_score": 0.8955226696643858, "ground_truth": 0}, {"key": "40339241", "model": "llama", "target_model": "claude", "recognition_score": 0.9124361565858988, "ground_truth": 0}, {"key": "40339241", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8740772393529552, "ground_truth": 0}, {"key": "40339241", "model": "llama", "target_model": "gpt35", "recognition_score": 0.743167989600867, "ground_truth": 0}, {"key": "31792608", "model": "llama", "target_model": "llama", "recognition_score": 0.7931059559167296, "ground_truth": 1}, {"key": "31792608", "model": "llama", "target_model": "human", "recognition_score": 0.7620701243454712, "ground_truth": 0}, {"key": "31792608", "model": "llama", "target_model": "claude", "recognition_score": 0.852935471048903, "ground_truth": 0}, {"key": "31792608", "model": "llama", "target_model": "gpt4", "recognition_score": 0.771843496908211, "ground_truth": 0}, {"key": "31792608", "model": "llama", "target_model": "gpt35", "recognition_score": 0.6460136644363517, "ground_truth": 0}, {"key": "33132662", "model": "llama", "target_model": "llama", "recognition_score": 0.8568122947235562, "ground_truth": 1}, {"key": "33132662", "model": "llama", "target_model": "human", "recognition_score": 0.8104789040144992, "ground_truth": 0}, {"key": "33132662", "model": "llama", "target_model": "claude", "recognition_score": 0.6424324756962229, "ground_truth": 0}, {"key": "33132662", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7799928914706988, "ground_truth": 0}, {"key": "33132662", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8333245924853947, "ground_truth": 0}, {"key": "37577457", "model": "llama", "target_model": "llama", "recognition_score": 0.8210441233035214, "ground_truth": 1}, {"key": "37577457", "model": "llama", "target_model": "human", "recognition_score": 0.602061600825605, "ground_truth": 0}, {"key": "37577457", "model": "llama", "target_model": "claude", "recognition_score": 0.8019358227802952, "ground_truth": 0}, {"key": "37577457", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8679338494990942, "ground_truth": 0}, {"key": "37577457", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7969253514890559, "ground_truth": 0}, {"key": "38701278", "model": "llama", "target_model": "llama", "recognition_score": 0.8832359731343812, "ground_truth": 1}, {"key": "38701278", "model": "llama", "target_model": "human", "recognition_score": 0.9178933801619465, "ground_truth": 0}, {"key": "38701278", "model": "llama", "target_model": "claude", "recognition_score": 0.9437636568868074, "ground_truth": 0}, {"key": "38701278", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8799743728725615, "ground_truth": 0}, {"key": "38701278", "model": "llama", "target_model": "gpt35", "recognition_score": 0.8519527995523865, "ground_truth": 0}, {"key": "34570783", "model": "llama", "target_model": "llama", "recognition_score": 0.9742394418981516, "ground_truth": 1}, {"key": "34570783", "model": "llama", "target_model": "human", "recognition_score": 0.9053222954378549, "ground_truth": 0}, {"key": "34570783", "model": "llama", "target_model": "claude", "recognition_score": 0.924687698215222, "ground_truth": 0}, {"key": "34570783", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8933094041210713, "ground_truth": 0}, {"key": "34570783", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9012274150040807, "ground_truth": 0}, {"key": "39064526", "model": "llama", "target_model": "llama", "recognition_score": 0.7648916093755244, "ground_truth": 1}, {"key": "39064526", "model": "llama", "target_model": "human", "recognition_score": 0.7534666768749937, "ground_truth": 0}, {"key": "39064526", "model": "llama", "target_model": "claude", "recognition_score": 0.8019358232778848, "ground_truth": 0}, {"key": "39064526", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8548846453072003, "ground_truth": 0}, {"key": "39064526", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9207896774496938, "ground_truth": 0}, {"key": "40741545", "model": "llama", "target_model": "llama", "recognition_score": 0.6859494838787517, "ground_truth": 1}, {"key": "40741545", "model": "llama", "target_model": "human", "recognition_score": 0.8459424352759699, "ground_truth": 0}, {"key": "40741545", "model": "llama", "target_model": "claude", "recognition_score": 0.9032942145819581, "ground_truth": 0}, {"key": "40741545", "model": "llama", "target_model": "gpt4", "recognition_score": 0.7826624811257131, "ground_truth": 0}, {"key": "40741545", "model": "llama", "target_model": "gpt35", "recognition_score": 0.7106283188526848, "ground_truth": 0}, {"key": "36929751", "model": "llama", "target_model": "llama", "recognition_score": 0.963506234260532, "ground_truth": 1}, {"key": "36929751", "model": "llama", "target_model": "human", "recognition_score": 0.9235923166471153, "ground_truth": 0}, {"key": "36929751", "model": "llama", "target_model": "claude", "recognition_score": 0.9793540695496467, "ground_truth": 0}, {"key": "36929751", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9666631760348643, "ground_truth": 0}, {"key": "36929751", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9686195670266068, "ground_truth": 0}, {"key": "23984730", "model": "llama", "target_model": "llama", "recognition_score": 0.26588048759491106, "ground_truth": 1}, {"key": "23984730", "model": "llama", "target_model": "human", "recognition_score": 0.3451052843230858, "ground_truth": 0}, {"key": "23984730", "model": "llama", "target_model": "claude", "recognition_score": 0.42250462744645156, "ground_truth": 0}, {"key": "23984730", "model": "llama", "target_model": "gpt4", "recognition_score": 0.3702253692121777, "ground_truth": 0}, {"key": "23984730", "model": "llama", "target_model": "gpt35", "recognition_score": 0.23651622982615295, "ground_truth": 0}, {"key": "36007415", "model": "llama", "target_model": "llama", "recognition_score": 0.9837225404928222, "ground_truth": 1}, {"key": "36007415", "model": "llama", "target_model": "human", "recognition_score": 0.9726235140424151, "ground_truth": 0}, {"key": "36007415", "model": "llama", "target_model": "claude", "recognition_score": 0.9711290913541394, "ground_truth": 0}, {"key": "36007415", "model": "llama", "target_model": "gpt4", "recognition_score": 0.9549844675902206, "ground_truth": 0}, {"key": "36007415", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9678992948927202, "ground_truth": 0}, {"key": "38875041", "model": "llama", "target_model": "llama", "recognition_score": 0.9039745087993382, "ground_truth": 1}, {"key": "38875041", "model": "llama", "target_model": "human", "recognition_score": 0.9597620592150052, "ground_truth": 0}, {"key": "38875041", "model": "llama", "target_model": "claude", "recognition_score": 0.9362850088412894, "ground_truth": 0}, {"key": "38875041", "model": "llama", "target_model": "gpt4", "recognition_score": 0.8947894632462181, "ground_truth": 0}, {"key": "38875041", "model": "llama", "target_model": "gpt35", "recognition_score": 0.9032942079216794, "ground_truth": 0}]