[{"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3014196196053687, "2": 0.2524423432261291, "4": 0.2245564176068414, "1": 0.11299119315369308, "5": 0.10857886539974267}, "score": 2.963288994456574}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3210482036474702, "4": 0.25976772828343936, "2": 0.22743549937979354, "5": 0.1178678143266399, "1": 0.07386623179841653}, "score": 3.1203371415639607}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30528973575491725, "4": 0.2747818689187708, "2": 0.2137539268726464, "5": 0.13484018724114882, "1": 0.07132245958301726}, "score": 3.188065620604476}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29933764356921433, "4": 0.2639978288295847, "2": 0.21898673976873745, "5": 0.13477031768036254, "1": 0.08289697560127975}, "score": 3.148759334381407}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28371178433911426, "4": 0.22297056761987918, "2": 0.2208197325807704, "5": 0.18795246384742723, "1": 0.08453554349359488}, "score": 3.208986746412371}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2633520365073129, "2": 0.26031121057671613, "4": 0.1928651382252602, "1": 0.1682109722866264, "5": 0.11524303877663607}, "score": 2.826615008423766}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2815165615269375, "2": 0.26390251642328505, "4": 0.19406727532642282, "1": 0.1493384608164919, "5": 0.11116110872735609}, "score": 2.853807996753794}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27674468849709183, "2": 0.2538302607793947, "4": 0.19913450063011626, "1": 0.1457165911888549, "5": 0.12455887291850769}, "score": 2.90298733977839}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28098938111184496, "2": 0.24881321613854274, "4": 0.21499910793556262, "1": 0.1332802533073579, "5": 0.12190332090536433}, "score": 2.9434311942661955}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2818316421443967, "2": 0.26170077710518164, "4": 0.20016633161401046, "1": 0.14388458411208513, "5": 0.11239992598715857}, "score": 2.875494154150995}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2975929695875479, "3": 0.2505549052097838, "1": 0.22247187274412308, "4": 0.14504905259664974, "5": 0.08431639912291336}, "score": 2.571138788303829}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27085290268202217, "2": 0.26588430724004014, "4": 0.18539106872779082, "1": 0.16741979135299295, "5": 0.11044200913393999}, "score": 2.8055492679305303}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.26502839706530557, "3": 0.26205716814402197, "4": 0.19217212964700467, "1": 0.16445916116394094, "5": 0.11627386096079317}, "score": 2.830771561224602}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.28071465169130777, "3": 0.2616707879145388, "1": 0.17864421085349766, "4": 0.176338135976715, "5": 0.10261980845669758}, "score": 2.7435714984687456}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2869147057217883, "3": 0.25426750420311744, "1": 0.20125073711639713, "4": 0.16114145455822054, "5": 0.0964130030549366}, "score": 2.664547055567763}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31674526772094724, "2": 0.23991230937763258, "4": 0.22779303579780624, "5": 0.11584598333045282, "1": 0.09968183651555552}, "score": 3.0202094559125108}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3238403925989478, "2": 0.2632000472525568, "4": 0.21796506093024282, "1": 0.10052948614873343, "5": 0.09445312493321371}, "score": 2.942611609005632}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.33171901791093455, "2": 0.2559524996400094, "4": 0.22311675042877102, "5": 0.0959181361258845, "1": 0.0932794735646077}, "score": 2.9724411867166656}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3295827231328945, "2": 0.257235055307053, "4": 0.21989265137736153, "5": 0.09825695912031748, "1": 0.09501763243737996}, "score": 2.9691357871327133}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3305476019354016, "2": 0.2558066994481339, "4": 0.21784654196775646, "1": 0.09829363546084063, "5": 0.0974887102490714}, "score": 2.96042932687592}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28389012485311377, "2": 0.26688802248313775, "4": 0.19406168626937623, "1": 0.15196151211022899, "5": 0.1031794576012557}, "score": 2.8296062837741554}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2980142424984057, "2": 0.26360935173273936, "4": 0.20422515352706005, "1": 0.12664504840278654, "5": 0.10749395129722766}, "score": 2.902312410661933}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2917612640476026, "2": 0.24257204983795785, "4": 0.2222843635260213, "5": 0.12375811548584437, "1": 0.11961007522523621}, "score": 2.988008224742982}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29086457445883784, "4": 0.23750136693695095, "2": 0.22870886868989662, "5": 0.13522045938633737, "1": 0.10769145917076231}, "score": 3.063851346072227}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.292997823007853, "2": 0.25389321849050145, "4": 0.21347313192868164, "1": 0.12585082525159794, "5": 0.1137689774888143}, "score": 2.9354151830163198}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2866238070130739, "2": 0.26279865771870586, "4": 0.19916204283605307, "1": 0.14579012375614014, "5": 0.10561773254284712}, "score": 2.8560175032212394}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.291954911881863, "2": 0.25478849738603904, "4": 0.21762227554656363, "1": 0.1282460108369758, "5": 0.10738188281610728}, "score": 2.921105015492085}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3056740319140999, "2": 0.2654329267924602, "4": 0.21123403279581654, "1": 0.11838244927433862, "5": 0.09926755484924701}, "score": 2.907570484883247}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29373226200817976, "2": 0.24390028628029603, "4": 0.2295062538412194, "5": 0.12139774202430696, "1": 0.11145480573290519}, "score": 3.005491887649176}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3085184906980406, "2": 0.2480084402822769, "4": 0.22908744326377117, "5": 0.11016439817751808, "1": 0.10421505274202666}, "score": 2.992977650490618}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3115054639929881, "2": 0.25772501391707014, "4": 0.2232969453072683, "1": 0.10728792184860592, "5": 0.10017419083569142}, "score": 2.951343960222782}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3084331662844239, "2": 0.2673934258684574, "4": 0.2124969167786218, "1": 0.11444780631021233, "5": 0.097216969443644}, "score": 2.910640770305536}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3024607989974006, "2": 0.2398016393716195, "4": 0.23843248273249573, "5": 0.12491484672747785, "1": 0.09437740389521217}, "score": 3.0597064949567914}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2867014925906947, "2": 0.23684394846800114, "4": 0.23493807739667488, "5": 0.1290176193291892, "1": 0.11248825081405582}, "score": 3.0311531965380136}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29707480595246977, "2": 0.2612396483575288, "4": 0.2103299691015054, "1": 0.1223996950902185, "5": 0.10894430398049694}, "score": 2.922178637546326}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26472651626062327, "2": 0.2452966216824138, "4": 0.20947302643697877, "1": 0.15344268028985442, "5": 0.12704694692557222}, "score": 2.91138367892946}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2664229221262559, "2": 0.25062319072493233, "4": 0.20584621872795672, "1": 0.1545485488447529, "5": 0.12255095209563073}, "score": 2.8912269461029867}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26471365086456466, "2": 0.257765119049334, "4": 0.19844182397942348, "1": 0.16390299828820679, "5": 0.1151660821331139}, "score": 2.843201253565384}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26984806516016985, "2": 0.2650176636325779, "4": 0.19792575368491927, "1": 0.1609594675565906, "5": 0.1062368440021838}, "score": 2.8234606881111204}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2626698916532597, "2": 0.2601475002946108, "4": 0.19453513296983863, "1": 0.17007735772372068, "5": 0.11256186470421643}, "score": 2.8193551558367598}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2646888483574943, "2": 0.25130360226872817, "4": 0.20923400755258884, "1": 0.15171128578139886, "5": 0.12304409400568977}, "score": 2.9005942163212097}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2640873656734548, "2": 0.2553371372946008, "4": 0.20341649546662952, "1": 0.15176287638847075, "5": 0.12537673428676208}, "score": 2.8953050438402244}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27114924232527615, "2": 0.2515442652397425, "4": 0.2168310717079098, "1": 0.13602887494633717, "5": 0.12442918749896648}, "score": 2.942086426293295}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.271476907085772, "4": 0.23844559687968175, "2": 0.22932838660176114, "5": 0.14565298521133713, "1": 0.11508194950609728}, "score": 3.070260277607836}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2678727833940126, "2": 0.24231188538747855, "4": 0.22477223013975894, "5": 0.1356684821983193, "1": 0.12936246610545712}, "score": 2.9950723170529834}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3222202374502232, "3": 0.30592622526585433, "2": 0.17387950841786046, "5": 0.15702742615575455, "1": 0.04093454301050363}, "score": 3.380531084413508}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.33147655362078543, "3": 0.30534545621602993, "2": 0.1636976582235964, "5": 0.1617553452142997, "1": 0.03771690788704629}, "score": 3.415859129710337}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.32665261899069425, "3": 0.3027936586528281, "5": 0.16784260730289505, "2": 0.16497873370904467, "1": 0.037721305934907114}, "score": 3.421921160967315}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3571115432232801, "3": 0.29221685448434603, "5": 0.17993347135419013, "2": 0.14117295628406848, "1": 0.029554348162968296}, "score": 3.5167024273959107}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31940678515054016, "4": 0.28513398111635346, "2": 0.20135744841347294, "5": 0.14360507238163045, "1": 0.05048768670779566}, "score": 3.2700137412567383}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29500422520974157, "4": 0.27162191446768097, "2": 0.20796162739040627, "5": 0.14662212207399, "1": 0.07877481025794239}, "score": 3.199357961005836}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.2974611056066433, "3": 0.29261822673757215, "2": 0.18295662062601203, "5": 0.16934119398126338, "1": 0.05760664231270423}, "score": 3.3379790672071157}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31109025496956755, "4": 0.2888430551921302, "2": 0.19583241715506328, "5": 0.14618211084419172, "1": 0.05803808766958023}, "score": 3.2693024745949555}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2935185907948165, "3": 0.2890611562311666, "2": 0.17956056832058234, "5": 0.17864776590866635, "1": 0.05919280391325437}, "score": 3.352874691605334}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30323390730067096, "4": 0.25598347176624164, "2": 0.2227312925992076, "5": 0.13198282216205826, "1": 0.08604781059958415}, "score": 3.125124791821151}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.295366417553636, "2": 0.25735109448186355, "4": 0.20972878142822482, "1": 0.12473082045724533, "5": 0.11281113841266448}, "score": 2.928537483339396}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2969225941220323, "2": 0.2712146514105435, "4": 0.2015496149227597, "1": 0.1300994137009455, "5": 0.10020395700933485}, "score": 2.870542785482906}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2964203294571905, "2": 0.25467926749892145, "4": 0.21002477059637606, "1": 0.12401168300909966, "5": 0.11485252096759868}, "score": 2.9370264593231807}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29047577409169656, "2": 0.255400596457693, "4": 0.21046420243767314, "1": 0.1323460097485524, "5": 0.11130289614166065}, "score": 2.912976463180886}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27979426884555814, "2": 0.2528415173929766, "4": 0.2100624524201796, "1": 0.1380129579561672, "5": 0.11927565930392267}, "score": 2.9197452828481953}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2892775127171271, "2": 0.23922601606652177, "4": 0.22723328545107283, "5": 0.1269969764864816, "1": 0.11724752272780692}, "score": 3.0075063171690792}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28618683849690973, "4": 0.2358234139516134, "2": 0.22966783719718598, "5": 0.1359185730674714, "1": 0.11238852921248971}, "score": 3.0532164524975745}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3024662433407815, "2": 0.2527985885480854, "4": 0.21859040437880806, "1": 0.11426300801245569, "5": 0.11186375739449578}, "score": 2.9609926125271513}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2779145740788847, "4": 0.25339617650034424, "2": 0.2205444537734359, "5": 0.1520564873301645, "1": 0.09607658933683368}, "score": 3.1448132157767983}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28726119212528617, "2": 0.24326864775281232, "4": 0.22197908794339194, "1": 0.12581266048427872, "5": 0.12166303059924415}, "score": 2.970410725305066}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27087237770584377, "2": 0.25267881567939526, "4": 0.1947250724720094, "1": 0.15848952122427354, "5": 0.12322194730980668}, "score": 2.871509532949894}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28410789528336367, "2": 0.2648085942020877, "4": 0.2038491131967138, "1": 0.13492402995715438, "5": 0.11230038375645386}, "score": 2.8937921662562474}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29452405453207525, "2": 0.27389115391597235, "4": 0.19037640264377384, "1": 0.1425635804763761, "5": 0.0986323280915973}, "score": 2.8286206050850913}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2773988546458945, "2": 0.25286134094501334, "4": 0.21182229223664292, "1": 0.13509388470396794, "5": 0.12281075324023243}, "score": 2.9343938437355286}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2906404914927651, "2": 0.2514535495848224, "4": 0.21458421648983195, "1": 0.12666375525790283, "5": 0.11664783972204323}, "score": 2.9430982584255627}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "human", "scores": {"3": 0.25863370104562516, "2": 0.24825307237512617, "4": 0.20382644643562162, "1": 0.1565204823390243, "5": 0.1327465244991733}, "score": 2.9080236397041292}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27103413679561805, "2": 0.24941178336496322, "4": 0.2125825915523658, "1": 0.13936827347432895, "5": 0.12758014801436113}, "score": 2.9395931638751582}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2665545942189902, "3": 0.2635300436113083, "4": 0.1888673995186953, "1": 0.1673444693955956, "5": 0.11368559264713798}, "score": 2.814991740042401}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27835452721936793, "4": 0.2393920247273139, "2": 0.2278707264685198, "5": 0.14455971560712633, "1": 0.10980840550147247}, "score": 3.0810251014751677}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2705753665755091, "2": 0.2557791505501381, "4": 0.20943327222935468, "1": 0.14723559324214308, "5": 0.11695912081272346}, "score": 2.8930993064227573}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2839523887844846, "2": 0.26962332139353345, "4": 0.19968335341435672, "1": 0.1445294190659235, "5": 0.10219975484421494}, "score": 2.8453988850821803}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29021408622386036, "2": 0.23621707202363298, "4": 0.23486838160899265, "5": 0.13229641575859294, "1": 0.1063936270516018}, "score": 3.050457412631028}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30186493401774683, "2": 0.24875432901984815, "4": 0.2241939395846541, "5": 0.11882823879562014, "1": 0.1063468347877748}, "score": 3.000402423298424}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29217247011522807, "4": 0.24630102802279072, "2": 0.22777166981312877, "5": 0.1389718895161777, "1": 0.09477221532203023}, "score": 3.1069298536570207}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2924665435142826, "2": 0.2478096172518627, "4": 0.21982537451992423, "5": 0.12029182661465028, "1": 0.11959361801116752}, "score": 2.973411828294689}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.2820249603729952, "2": 0.26530151694687576, "3": 0.2111423560020676, "4": 0.13861481605441633, "5": 0.10289706082100282}, "score": 2.51504814537799}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.25779721280445045, "3": 0.23556754296532811, "1": 0.20514650429305556, "4": 0.17664878203371287, "5": 0.12482581418563408}, "score": 2.758206769159192}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.25842398246069537, "3": 0.23538883857492945, "1": 0.218492781850787, "4": 0.171003081871762, "5": 0.11667559354429932}, "score": 2.7089401468431173}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.24853609313209674, "3": 0.24200528844154254, "1": 0.19137659320432757, "4": 0.1864714937698149, "5": 0.13159358598427567}, "score": 2.8183663083297152}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.24797191132944674, "3": 0.23853047477073602, "4": 0.1903799436777945, "1": 0.1874687713955792, "5": 0.13563554588947124}, "score": 2.8387394280338785}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "human", "scores": {"2": 0.26740612735784414, "3": 0.24143391191668875, "1": 0.20757519903007182, "4": 0.17318269521481533, "5": 0.11039427537178748}, "score": 2.7114124721235764}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.26313204514659727, "3": 0.25492397895906105, "1": 0.18773231259363246, "4": 0.18206471102821406, "5": 0.11213987533252982}, "score": 2.767746147712842}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2729591578320306, "3": 0.2524262126757735, "1": 0.19733018249102674, "4": 0.16755694757108072, "5": 0.10971291373362836}, "score": 2.7193591588821304}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.27384443207060105, "3": 0.2498995354716252, "1": 0.1995194407562817, "4": 0.1733514399986199, "5": 0.10337791786653648}, "score": 2.7072218442392675}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.25107147987854067, "2": 0.24976132927995953, "4": 0.188810086960562, "1": 0.18034227606934028, "5": 0.13000671188171292}, "score": 2.838376317578873}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31217798159170984, "2": 0.2573245372192913, "4": 0.22145855890072705, "1": 0.10776921892611142, "5": 0.10126298847381064}, "score": 2.9511212325613676}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2818194390984897, "4": 0.2601819200857187, "2": 0.20512207279931857, "5": 0.15918745642122778, "1": 0.09367899385341297}, "score": 3.186078655117823}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29760707582862156, "4": 0.2712168482581172, "2": 0.20643363466557632, "5": 0.14928645528787807, "1": 0.07544661190089061}, "score": 3.2124648920249315}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31174547791885354, "4": 0.25308352661932115, "2": 0.22971811698967093, "5": 0.12220100598443599, "1": 0.08324297816877133}, "score": 3.1012823660986473}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3103537509507774, "2": 0.24521284266671767, "4": 0.23861731566763697, "5": 0.11094788415968715, "1": 0.09486200711964582}, "score": 3.0255763856401554}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26225336513641795, "2": 0.2559404189671325, "4": 0.19120083714518935, "1": 0.1718761533815936, "5": 0.11871794610989395}, "score": 2.8289420742278764}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.26508845930487535, "2": 0.26244472252050255, "4": 0.1940934761771095, "1": 0.16055167911238433, "5": 0.11780946063455197}, "score": 2.846162439536481}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28457259244047584, "2": 0.24133726112913617, "4": 0.21767020124806508, "1": 0.13003757913891204, "5": 0.12637133538557893}, "score": 2.9690001106630906}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2737691899594076, "2": 0.2562222108176053, "4": 0.20126538870337046, "1": 0.15120269368778397, "5": 0.11752836150657786}, "score": 2.877693026842313}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2823773731442443, "2": 0.24218383317204495, "4": 0.21517733002361217, "1": 0.1332625548649213, "5": 0.12697970607209424}, "score": 2.960427039357308}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28933531613853747, "2": 0.2609124939755597, "4": 0.19942566871002856, "1": 0.13549237680320034, "5": 0.1148199534109501}, "score": 2.8971668686489376}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2937790279067582, "2": 0.24522243067631028, "4": 0.22059004502372428, "1": 0.12057494128325708, "5": 0.11981954017082659}, "score": 2.9738564457222316}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2937705084384818, "2": 0.24040090782930282, "4": 0.2247575754681013, "5": 0.12673987770695577, "1": 0.11431946788285362}, "score": 3.0091975945555527}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29234370412357286, "4": 0.2473660637542325, "2": 0.22105847935544756, "5": 0.14574499412025335, "1": 0.09347343506576977}, "score": 3.1308524459308793}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30032351560972464, "2": 0.2373752397131905, "4": 0.23430520935955396, "5": 0.13084123988653082, "1": 0.09714490006573293}, "score": 3.0643232857903673}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28172758093503775, "2": 0.24932368174596778, "4": 0.2225250498761231, "5": 0.12499153049692241, "1": 0.12141937702955742}, "score": 2.980345423881045}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28882780468143315, "4": 0.24176923068367012, "2": 0.23257728513677284, "5": 0.14091788981054196, "1": 0.09589750635361537}, "score": 3.0992337329143664}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30596058271008614, "2": 0.24177036700172472, "4": 0.23924051360236628, "5": 0.11990961839791944, "1": 0.09310807162636622}, "score": 3.051073794123906}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2948930590678354, "4": 0.24115432445322862, "2": 0.23390381386228287, "5": 0.13547722960221803, "1": 0.09456464540477301}, "score": 3.089076296071645}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28417375912681486, "4": 0.2424587224000867, "2": 0.22256181405099984, "5": 0.14967024073557025, "1": 0.10112023748905148}, "score": 3.116998696287378}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2901636223822242, "2": 0.26532260925588125, "4": 0.19301287161410924, "1": 0.15504316762974268, "5": 0.09643847873553295}, "score": 2.8104772361841106}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2979212169739377, "2": 0.2597960185294253, "4": 0.20243856928794013, "1": 0.1367549008905641, "5": 0.10307476296788656}, "score": 2.8752804625698785}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31861942930027976, "2": 0.2844674338448154, "4": 0.19124594674313974, "1": 0.12369784758722956, "5": 0.0819510140385526}, "score": 2.823281606820378}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3009320461560058, "2": 0.2559971160489037, "4": 0.21904236946531108, "1": 0.11539045968877762, "5": 0.10862366342067666}, "score": 2.949510936603467}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3001764531703105, "2": 0.24406036176514506, "4": 0.22021276199332648, "5": 0.11970886607859496, "1": 0.11582791276659389}, "score": 2.9839140873723555}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29999844130183007, "2": 0.2865462284492478, "4": 0.18644354378780226, "1": 0.139712491515317, "5": 0.08728386985906428}, "score": 2.7950369104526143}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29294324259774973, "2": 0.2773144827479275, "4": 0.1987961204080768, "1": 0.13595896047478204, "5": 0.09497657468985891}, "score": 2.8395151618887104}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2958706539678304, "2": 0.25564771384888135, "4": 0.21260663600315846, "1": 0.1217580987164648, "5": 0.11410331147127235}, "score": 2.941648554901603}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3008587480376354, "2": 0.2643371519243187, "4": 0.21633245738979195, "1": 0.11694036207423615, "5": 0.10151915287761037}, "score": 2.9211519308267757}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29527917919962987, "2": 0.2819584385314029, "4": 0.1977848411480555, "1": 0.1360837872808292, "5": 0.08887900754042087}, "score": 2.8214142096562562}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2974805899471657, "2": 0.2855909033612432, "4": 0.17396892285514984, "1": 0.15800732283060737, "5": 0.08494140611663865}, "score": 2.742243388146508}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.3047323587223017, "3": 0.29432929129504504, "1": 0.18123836144977004, "4": 0.14994611241477387, "5": 0.069740595424155}, "score": 2.62221320437043}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.31164903878788836, "3": 0.29656534410076824, "1": 0.17687896391657398, "4": 0.15011351566391076, "5": 0.06478221974020917}, "score": 2.6142667771687194}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.28937614423199887, "3": 0.2890231182859583, "4": 0.17313682519460533, "1": 0.16283572637684407, "5": 0.0856163079966815}, "score": 2.7293186290722597}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.30368645738672834, "3": 0.2892429171954595, "1": 0.17585480429855488, "4": 0.15707069317141822, "5": 0.07413424556991179}, "score": 2.6499393088346648}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28257406097808735, "2": 0.25931641069253014, "4": 0.2047983996615301, "1": 0.14236142621804723, "5": 0.11093444918441954}, "score": 2.8826262445687036}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28173913200265144, "2": 0.25221380970289714, "4": 0.22056836208803218, "1": 0.1241893949505504, "5": 0.1212785394444365}, "score": 2.9625324381540716}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2839008844927396, "2": 0.2575075342713958, "4": 0.21222352426847982, "1": 0.13027639110822026, "5": 0.11608015907686123}, "score": 2.926322678145463}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28565511141303346, "2": 0.25389202519517884, "4": 0.2166155837209166, "1": 0.12495137716915124, "5": 0.11887520899629246}, "score": 2.950570693607464}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2787069799879479, "2": 0.252716467627932, "4": 0.21545722091057995, "1": 0.12983247673989687, "5": 0.12327440173209105}, "score": 2.9496239759343306}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3018722694247683, "3": 0.30034057446987833, "4": 0.17038436900258042, "1": 0.1507582527896482, "5": 0.07663466185120461}, "score": 2.720262155999713}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.31453094921641683, "3": 0.3126432859035977, "4": 0.17344027069337084, "1": 0.13158573008169341, "5": 0.06779010761937204}, "score": 2.7313154820041454}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.329583975549622, "2": 0.27235642076845573, "4": 0.21842377088185674, "5": 0.09203454346128027, "1": 0.08759179060377978}, "score": 2.9549524279334523}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30471919456875257, "2": 0.24755121229856664, "4": 0.23604431881456975, "5": 0.1142675329171655, "1": 0.09740842237982658}, "score": 3.022211534580441}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.3060870317454335, "3": 0.30411136877777617, "4": 0.1719824400694443, "1": 0.14370521437802522, "5": 0.07409864744133947}, "score": 2.7266780932847237}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2893760863567758, "4": 0.24326020647719226, "2": 0.2243507283669508, "5": 0.1419896232152496, "1": 0.10100597555299014}, "score": 3.100878526706666}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2907795380901891, "4": 0.2508776020552852, "2": 0.2213606958470211, "5": 0.14013200608741483, "1": 0.09683268371537256}, "score": 3.1161175800147127}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28204859505495383, "4": 0.25603492961540725, "2": 0.20962270647162287, "5": 0.1575557208670723, "1": 0.09472324969495964}, "score": 3.1720797119745208}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28374472518945537, "4": 0.2616273541688457, "2": 0.20788766859389524, "5": 0.16109540691103, "1": 0.08562389393762225}, "score": 3.2046869999598657}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2956434829747065, "4": 0.2732795541117781, "2": 0.2087424674445882, "5": 0.1453659533253321, "1": 0.07695628851069423}, "score": 3.2013588836743074}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2802179740276669, "2": 0.2571787784338663, "4": 0.19623618886622876, "1": 0.15457289215818154, "5": 0.1117834233306343}, "score": 2.8534768986527146}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2726143281561302, "2": 0.2710795659237996, "4": 0.18487959567084242, "1": 0.16844494811363253, "5": 0.1029669619472474}, "score": 2.7828408868503187}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2775249333283529, "2": 0.25699388195316086, "4": 0.19341870190341792, "1": 0.15905395415732132, "5": 0.11299736264126474}, "score": 2.8443098984799047}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28045948582856284, "2": 0.2704926643276297, "4": 0.18689294737197185, "1": 0.1626363910034777, "5": 0.09950507809392892}, "score": 2.7901348380279445}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.281569942127324, "2": 0.24612894837454322, "4": 0.21385971848634985, "1": 0.13443015614268328, "5": 0.12399743488529227}, "score": 2.946864594329287}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3277187198326576, "2": 0.2718080935811542, "4": 0.21366754499435817, "1": 0.10373458595678904, "5": 0.0830613821946481}, "score": 2.9005120814984724}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3443274103449816, "2": 0.2648532976656552, "4": 0.22980678231789203, "5": 0.0842840615549519, "1": 0.07672263525503967}, "score": 2.980076221437897}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.34539737955324595, "2": 0.25741492546801015, "4": 0.23565198550392594, "5": 0.08842951367122237, "1": 0.07309854621820643}, "score": 3.0088990630160897}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3199514223078252, "4": 0.25624762932165546, "2": 0.23318177018732408, "5": 0.11313893525206492, "1": 0.07746991589383577}, "score": 3.0944048727734317}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3266979941907067, "2": 0.24802443734257473, "4": 0.23683726956282733, "5": 0.09700945800751178, "1": 0.09142164613052016}, "score": 2.99998845586809}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3125525074750371, "2": 0.2828652056307346, "4": 0.18812897765903694, "1": 0.1319516119153741, "5": 0.08447963327515919}, "score": 2.810315629543452}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31699106234423824, "2": 0.2774750943260034, "4": 0.19737535653977156, "1": 0.12201576759719827, "5": 0.08612418609230695}, "score": 2.8481142842907547}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31986440735552746, "2": 0.29006292406609907, "4": 0.18966923354240545, "1": 0.12298655973836053, "5": 0.07740452790754801}, "score": 2.8084398805471658}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30499222332343506, "2": 0.25454198145353, "4": 0.2223027694333153, "5": 0.11097930905003558, "1": 0.10716878043990663}, "score": 2.975381477490411}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30627864095816926, "2": 0.2732726948810536, "4": 0.20412520977763685, "1": 0.11975619634756718, "5": 0.09655737381545604}, "score": 2.8844537277475726}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27792760857806564, "2": 0.24254134216028536, "4": 0.22552772017253303, "5": 0.12900181563881713, "1": 0.12499088054265366}, "score": 2.9910081525950916}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28155347076750153, "2": 0.252477258416527, "4": 0.21572841508057708, "1": 0.13053305359990233, "5": 0.11969708730569799}, "score": 2.9415785981002642}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2823402994290932, "4": 0.23496472088530893, "2": 0.23110803356891593, "5": 0.13876687668314247, "1": 0.11280914167318573}, "score": 3.0557727668077366}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2807444090214977, "4": 0.24903572971007298, "2": 0.22380077952010266, "5": 0.14744076162106384, "1": 0.09897100010418103}, "score": 3.122175367550246}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2799370283098021, "4": 0.23499663126107062, "2": 0.23007981695980342, "5": 0.1417956560071065, "1": 0.11317816732140307}, "score": 3.0621525810192054}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2587383912870798, "3": 0.25643663036542713, "1": 0.1861629711350944, "4": 0.18112495985207072, "5": 0.11752555261230427}, "score": 2.785109261404518}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2750723018647689, "3": 0.2500461695427012, "1": 0.210991759662693, "4": 0.1623411165213956, "5": 0.1015342803583585}, "score": 2.6683490895444626}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.26129231957971844, "3": 0.25818512825537554, "1": 0.18959106799536526, "4": 0.17752301792916925, "5": 0.11339737909416195}, "score": 2.763840702214381}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2594912748163093, "3": 0.2533670629522697, "1": 0.19625873769973518, "4": 0.1754838259767182, "5": 0.11538864807278172}, "score": 2.7542498036984533}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.28198483107640127, "3": 0.2594844243370808, "1": 0.20139174250699693, "4": 0.160996508591483, "5": 0.0961275234255234}, "score": 2.668478276451208}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29832952942124297, "2": 0.2609795571037543, "4": 0.2112163110039045, "1": 0.12711924449677242, "5": 0.10234014077953209}, "score": 2.9006770350487647}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29289543816150587, "2": 0.23348631773827008, "4": 0.2332424053297997, "5": 0.13292792698645675, "1": 0.10743704831640946}, "score": 3.050738396126545}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28770259173544116, "4": 0.2329877737428164, "2": 0.2300244664147805, "5": 0.13615482794586012, "1": 0.11311962408407247}, "score": 3.04903424050631}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2829957214512516, "4": 0.25299635436068446, "2": 0.21210363063405266, "5": 0.159062940959606, "1": 0.0928308740515054}, "score": 3.173358674089136}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29283417084462726, "4": 0.23742810906585857, "2": 0.23506424951830432, "5": 0.1307408969837492, "1": 0.103919886375991}, "score": 3.0560065913305388}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2676166052900097, "3": 0.2657376858980503, "4": 0.18747760138265646, "1": 0.17617536288018626, "5": 0.10297840221221471}, "score": 2.7734638256985757}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29353041983237904, "2": 0.23947338395946693, "4": 0.23033357377441235, "5": 0.12664717605747194, "1": 0.11000820775706897}, "score": 3.0241383011437213}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2942107299093772, "2": 0.25626005763306164, "4": 0.21955864648273848, "1": 0.11926067922188294, "5": 0.11070106707206019}, "score": 2.946178889865016}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28449443108528605, "2": 0.23629274447009752, "4": 0.23183028620250337, "5": 0.13682723600587396, "1": 0.11054643721648984}, "score": 3.048099565714774}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28694084484209836, "2": 0.24979542402831986, "4": 0.22546785051087653, "5": 0.12301664593026378, "1": 0.11476870922230133}, "score": 2.9921682174653204}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2897829455097328, "2": 0.24599939559098696, "4": 0.2236195966486768, "1": 0.1207601055616151, "5": 0.11982925792958424}, "score": 2.975758294920868}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27384925177501873, "2": 0.25776151036292816, "4": 0.20486316715470412, "1": 0.14660191893759625, "5": 0.11691045255520811}, "score": 2.8877171858406387}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27223982271450764, "2": 0.25017082361481563, "4": 0.2068564716257905, "1": 0.14431877655660608, "5": 0.1264006063763041}, "score": 2.920848239171888}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2744097916256806, "2": 0.2342754779149863, "4": 0.23202619597610274, "5": 0.1361991671758742, "1": 0.12307878502525946}, "score": 3.023991736249666}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2801280665062348, "2": 0.2377547497115342, "4": 0.23449636319016737, "5": 0.13904424321308698, "1": 0.10856903945705462}, "score": 3.0576924558719254}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.28636664891371966, "3": 0.248004149773373, "1": 0.21247785666004587, "4": 0.15954033575214824, "5": 0.09359877342670492}, "score": 2.635411059453241}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2782057030173497, "3": 0.24434356274903474, "1": 0.19048414809070227, "4": 0.18255757066621367, "5": 0.10439440467885375}, "score": 2.732168467592791}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2574947364649706, "3": 0.2549413143790279, "4": 0.19590026525497825, "1": 0.17089722953873138, "5": 0.12075465940366602}, "score": 2.838118479134036}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2789601887485121, "3": 0.2545136016048039, "1": 0.18599739699823625, "4": 0.17643668362000592, "5": 0.10408126403615818}, "score": 2.7336413349624973}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2562877095850762, "3": 0.24956177481203345, "4": 0.18914455783616274, "1": 0.17893950341761827, "5": 0.12604864186245837}, "score": 2.8270720448638746}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2666430783719444, "2": 0.2604330126483072, "4": 0.18709903563334696, "1": 0.173415314434064, "5": 0.11239091187456514}, "score": 2.8046135744879854}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2851430200068205, "2": 0.25818517989240636, "4": 0.20180945880210877, "1": 0.14268759341641285, "5": 0.11215923234547437}, "score": 2.882565734712163}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2741489793776594, "2": 0.27234933959357144, "1": 0.18878658156797645, "4": 0.16793556748821095, "5": 0.09675989290999172}, "score": 2.711527185243005}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2766381346358145, "2": 0.25997661352316476, "4": 0.19417091550900445, "1": 0.15556814684301248, "5": 0.11362887768796621}, "score": 2.8503131723271684}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27328859981472475, "2": 0.25658058299171704, "4": 0.20176690167505418, "1": 0.15090673228331083, "5": 0.11744068281175997}, "score": 2.8782522108501625}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3062837864825596, "2": 0.25733601414958496, "4": 0.2180785412751548, "1": 0.11386178254453791, "5": 0.10443244248864465}, "score": 2.941883415029748}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3046231622141187, "2": 0.26540176679598243, "4": 0.2118883063473682, "1": 0.11940211077467919, "5": 0.09867904155748895}, "score": 2.905039868171273}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2933106771938678, "4": 0.2477519834379623, "2": 0.22295732356151504, "5": 0.14115728695558477, "1": 0.09481679717749776}, "score": 3.1174763362639}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3054875359674495, "4": 0.2491400726303474, "2": 0.23219663538097715, "5": 0.12868959687619033, "1": 0.08447947276400844}, "score": 3.105364389980192}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2952305802465372, "4": 0.24062444029248475, "2": 0.23678053015069309, "5": 0.1262530819044826, "1": 0.10110470661337495}, "score": 3.054141021346112}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "human", "scores": {"3": 0.32797040609128225, "2": 0.25292304663999254, "4": 0.23871803342480077, "5": 0.09946673622578407, "1": 0.08091480240688646}, "score": 3.0228990141480643}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3104030079994967, "4": 0.2762957027540968, "2": 0.20845353839693523, "5": 0.1414592060401956, "1": 0.06337909523917107}, "score": 3.224004502705463}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3528825136386351, "4": 0.26375643404657967, "2": 0.23246076985453284, "5": 0.10351787250258467, "1": 0.04737323368350927}, "score": 3.143586259417079}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3177744895906512, "4": 0.2994693212186487, "2": 0.19486914440684383, "5": 0.1470495020869156, "1": 0.040830905360193674}, "score": 3.3170394745630043}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.33108262910511177, "4": 0.2649613268661001, "2": 0.23251603234721432, "5": 0.10637323334809493, "1": 0.06505752503045355}, "score": 3.115077776003701}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3229926859931226, "2": 0.2589592928755053, "4": 0.22870825117678487, "5": 0.09757838258533072, "1": 0.09175123790370514}, "score": 2.981403058915518}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.32747826255091844, "2": 0.2575500265200647, "4": 0.23232716656588856, "5": 0.09293659430633446, "1": 0.0897005660013753}, "score": 2.981249058197749}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3353463837514417, "2": 0.27078869107138354, "4": 0.2204971741111078, "5": 0.08733179312656741, "1": 0.08602655081233991}, "score": 2.9523185191224255}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3271014537788346, "2": 0.2577605566471042, "4": 0.23678491063102025, "5": 0.10083424993058389, "1": 0.0775104510078746}, "score": 3.025672166910867}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3373780052297686, "4": 0.25628942671848287, "2": 0.22872766933159874, "5": 0.10764919856722378, "1": 0.06994813081202622}, "score": 3.1029646722719844}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28326390198886214, "2": 0.2629900973959835, "4": 0.20116592780552042, "1": 0.1401373031773593, "5": 0.11242836676604014}, "score": 2.8827562689411232}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29024804325839626, "2": 0.27146099900512805, "4": 0.20233729436896644, "1": 0.13189712715153123, "5": 0.10404290675191626}, "score": 2.8751661531461794}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2939246314853936, "2": 0.25537832649666625, "4": 0.21186675840234423, "1": 0.12628068384496907, "5": 0.11253380652894253}, "score": 2.9289935558516915}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2946425653960755, "2": 0.25441380094244365, "4": 0.2160772059951436, "1": 0.12140082556611521, "5": 0.11344910009051987}, "score": 2.945759059016975}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2964402792166648, "2": 0.26094881552264215, "4": 0.208047720523728, "1": 0.12621331844675607, "5": 0.1083315875904546}, "score": 2.9113338225860477}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27055910548462864, "2": 0.24544777095056522, "4": 0.21678959589118044, "1": 0.13892963458976304, "5": 0.12825897716410817}, "score": 2.949999764289802}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2739585394279138, "4": 0.23313618760709487, "2": 0.23237835387875855, "5": 0.1416590733563333, "1": 0.11885559620490786}, "score": 3.0463653559847743}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26985419078077455, "2": 0.25075480244511655, "4": 0.2152684338681795, "1": 0.1410327706007692, "5": 0.12307783732226345}, "score": 2.9286029106010982}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2779998791510633, "2": 0.2356170409056817, "4": 0.22937978485215746, "5": 0.13692007740365716, "1": 0.12006970858320065}, "score": 3.0274638525994364}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2787708111947594, "2": 0.2484902424527691, "4": 0.2167068630929878, "1": 0.13479371583841315, "5": 0.12122650998687931}, "score": 2.941081510315037}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27262313374113906, "2": 0.2534838920953391, "4": 0.20463366467933194, "1": 0.14544893735213457, "5": 0.12379479044859024}, "score": 2.9078400427696223}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27460845386914223, "2": 0.2465328570652367, "4": 0.2166187463315259, "1": 0.135675021576759, "5": 0.12655375757724627}, "score": 2.951842823660768}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27728395210411977, "4": 0.23705912414333333, "2": 0.22591794971239007, "5": 0.1433170600418389, "1": 0.11641109853398984}, "score": 3.0649537999521477}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27210017229185257, "2": 0.23656577294771283, "4": 0.22854688584562832, "5": 0.13798600665735836, "1": 0.12479033125079933}, "score": 3.0183726627054654}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2536407711048958, "4": 0.22527459469933447, "2": 0.21904061713336467, "5": 0.16225858704854126, "1": 0.13977269262304937}, "score": 3.0512064186531207}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30897175933466564, "2": 0.2605055793937093, "4": 0.22435535003955823, "1": 0.10336023141790837, "5": 0.1027944002213209}, "score": 2.9627176355274725}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3019435800762628, "2": 0.24083878770742884, "4": 0.23616657421204273, "5": 0.12648612001957554, "1": 0.09455501921385223}, "score": 3.059190575213812}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30815690312231275, "2": 0.26882230335079416, "4": 0.20881704357246292, "1": 0.11437474327261354, "5": 0.09981689713760465}, "score": 2.9108779687244732}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30476828878543066, "4": 0.25027847025626715, "2": 0.23377337869666012, "5": 0.1262935146142398, "1": 0.08487731653375316}, "score": 3.0993383848568232}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2881528530159339, "4": 0.2522457672170523, "2": 0.22555726623910077, "5": 0.14414039342862622, "1": 0.08989418702960278}, "score": 3.135182202477354}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26280002427527904, "2": 0.23624962497900498, "4": 0.22654864248678686, "5": 0.13802361296779955, "1": 0.13636772251897525}, "score": 2.993610732131011}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2792330894204657, "2": 0.2643932502197757, "4": 0.20163412223282998, "1": 0.14768026703929266, "5": 0.10704684891684492}, "score": 2.8559722466308077}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2658549818182783, "2": 0.24287812613334955, "4": 0.22301188789426435, "1": 0.13870806586994902, "5": 0.12953574665338222}, "score": 2.9617886956809722}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2656725881398063, "4": 0.2579834096010504, "2": 0.21316836063031327, "5": 0.16151181194752318, "1": 0.10165461896991568}, "score": 3.1645309503730505}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.25524653422304105, "2": 0.24992797565697772, "4": 0.198992190250522, "1": 0.16767149512549198, "5": 0.12814936260553422}, "score": 2.870018332303726}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29766663296298745, "4": 0.2403026279927734, "2": 0.22668316168231428, "5": 0.12879462468434, "1": 0.10653973125247342}, "score": 3.0581300217359213}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29556405424255927, "2": 0.2417450066204015, "4": 0.22942153577221908, "5": 0.12290054843143086, "1": 0.1103500933869704}, "score": 3.0127776789697553}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32915385274576325, "2": 0.2563002936205524, "4": 0.21823275549657692, "1": 0.09983158128316602, "5": 0.09646708663066703}, "score": 2.955202826137806}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3090446234658602, "2": 0.2526032002262794, "4": 0.22215072189986174, "1": 0.11069713725393386, "5": 0.10548640467602494}, "score": 2.9591253243510343}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3006056818936753, "4": 0.2381995050354295, "2": 0.23683092240905532, "5": 0.12511359429338473, "1": 0.0992363202647556}, "score": 3.053123873148392}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3083408660511739, "4": 0.2777282392684137, "2": 0.20587073647260992, "5": 0.13901643714514383, "1": 0.06903359560863405}, "score": 3.2118253306964704}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3085689375951912, "3": 0.2961620524423941, "2": 0.1814498812089077, "5": 0.1607753065919809, "1": 0.05303294260142775}, "score": 3.342607511786404}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31196012619403474, "4": 0.27764837611167253, "2": 0.212791897052592, "5": 0.12854864319664955, "1": 0.06904298481608845}, "score": 3.183869261741603}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3031147294776468, "4": 0.2818305430031357, "2": 0.20965570368243389, "5": 0.13733436585051365, "1": 0.06805316098806445}, "score": 3.2107396719192307}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.30212474016007057, "3": 0.2926573816757166, "2": 0.1908667000657084, "5": 0.16025292990659648, "1": 0.054087979943835816}, "score": 3.3235912627352437}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28552271239584587, "2": 0.28551834393176506, "4": 0.18268120398671162, "1": 0.15336045705101561, "5": 0.09290788133507635}, "score": 2.776255605134981}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2983333778969951, "2": 0.2795967478857592, "4": 0.19358532647754143, "1": 0.1290129489759034, "5": 0.09945910741968403}, "score": 2.854879082724027}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3108238580755378, "2": 0.2736786694566781, "4": 0.20561057744654987, "1": 0.11226137737893695, "5": 0.0976156939326027}, "score": 2.9026395846567468}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30542458147397, "2": 0.26389425640379094, "4": 0.2129374326182708, "1": 0.11040836258006967, "5": 0.1073268529683307}, "score": 2.942879670671056}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3031857272608064, "2": 0.2562906056525573, "4": 0.22262200290268525, "5": 0.11262240549380051, "1": 0.10527076854948447}, "score": 2.981034510119083}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31123836917931835, "2": 0.27847393908213575, "4": 0.19556833910488589, "1": 0.12488352201220211, "5": 0.08979577982909075}, "score": 2.8469127843922406}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29043746286377486, "2": 0.2766092827830222, "4": 0.19541194699878536, "1": 0.14255526926190856, "5": 0.09496174050747215}, "score": 2.82361132088796}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3198598333272067, "2": 0.2777077436806522, "4": 0.20492904125163802, "1": 0.10340902896245217, "5": 0.0940812037454785}, "score": 2.9085644448479457}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31172533981144784, "2": 0.24709786654473936, "4": 0.23372901271984786, "5": 0.10906146026692527, "1": 0.09837409222374793}, "score": 3.0080059801620576}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3065538946730385, "2": 0.2632577996781335, "4": 0.2229752723484907, "1": 0.10488223811343957, "5": 0.10231691220411822}, "score": 2.9545861903725776}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30344700396198826, "2": 0.284225995064078, "1": 0.1759287667932871, "4": 0.160040511327513, "5": 0.07632262177762072}, "score": 2.676590874223957}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2994844448012375, "2": 0.28089296210269576, "1": 0.18452251323349073, "4": 0.15902405482456508, "5": 0.07604863569629099}, "score": 2.6611740574279454}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2995161918349495, "3": 0.28939715370270463, "1": 0.2086549809406878, "4": 0.13977873093379725, "5": 0.06261541407224405}, "score": 2.548166448719475}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3060562103332209, "2": 0.28295746301603986, "4": 0.1834893777654141, "1": 0.14231604862894093, "5": 0.08516478944424147}, "score": 2.786225952306452}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.31755857165809853, "3": 0.28315659362725143, "1": 0.19385990886986196, "4": 0.1431097443570183, "5": 0.0622933811752786}, "score": 2.5624085776800034}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2851135377428111, "2": 0.24962614509394856, "4": 0.20691338566930245, "1": 0.15049494250135723, "5": 0.10783591637258849}, "score": 2.8719671304941587}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2949759946562426, "2": 0.23506370887115216, "4": 0.22779417476583266, "5": 0.12380419921019274, "1": 0.11834632446374659}, "score": 3.003646272262248}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2922086433061026, "2": 0.25450021454144234, "4": 0.20526258850185683, "1": 0.13813547119872385, "5": 0.10988048542399866}, "score": 2.8942510702887483}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2841679052076725, "2": 0.2407799338999414, "4": 0.2262121054847979, "5": 0.12452484808243058, "1": 0.12430674724497827}, "score": 2.985868253704054}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2904398154167519, "4": 0.24026925227574242, "2": 0.22774586474482367, "5": 0.13567408542233986, "1": 0.10586279606971151}, "score": 3.072146556832985}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26431653443056136, "2": 0.2600008964728639, "4": 0.19062205136295576, "1": 0.1686509811199245, "5": 0.11639453441323357}, "score": 2.8261056526788524}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.26665262436502235, "2": 0.24566128059727402, "4": 0.20480990965501886, "1": 0.1538165531405736, "5": 0.12904519334061798}, "score": 2.909604604247619}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2767142205841777, "2": 0.245188420683823, "4": 0.21459792885937118, "1": 0.13589126976885033, "5": 0.1275932894463787}, "score": 2.9528128458266014}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26498705586006127, "2": 0.2374766918268204, "4": 0.21325797412324254, "1": 0.14601604004301647, "5": 0.13824415748209998}, "score": 2.9602367982294684}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2731201146929462, "2": 0.24972439231091523, "4": 0.2048343244513427, "1": 0.1477410795226235, "5": 0.12456243535321572}, "score": 2.908751032922555}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28208365587430395, "2": 0.24631056005701887, "4": 0.21569728771617433, "1": 0.13714424826884772, "5": 0.11875435061269635}, "score": 2.9326062653193206}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27744118894113806, "2": 0.25344800131734546, "4": 0.21205069617434177, "1": 0.14036160408073928, "5": 0.11668989884896512}, "score": 2.911258520272737}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2908937496387669, "2": 0.26495372258514094, "4": 0.21129673636149918, "1": 0.13369649642059192, "5": 0.09914940748298974}, "score": 2.8772476221856667}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28673902427246983, "2": 0.261541868318652, "4": 0.20743639840648445, "1": 0.14262458222344723, "5": 0.10164885531642119}, "score": 2.8639418148154157}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2980946277790754, "2": 0.2550837643798211, "4": 0.2206067663828686, "1": 0.11928202879419339, "5": 0.10692371956680215}, "score": 2.9408058452900603}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2692724194814564, "2": 0.2529797330462191, "4": 0.19634817355257142, "1": 0.16060293538842346, "5": 0.12078055197822696}, "score": 2.863721467806261}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28384677814065445, "2": 0.2557118127652067, "4": 0.20748342956878402, "1": 0.14062748993159133, "5": 0.11231791521465294}, "score": 2.8951511489604984}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2832704737876208, "2": 0.2537278609297292, "4": 0.2066139919002538, "1": 0.13477983280067055, "5": 0.12159632888454536}, "score": 2.926518277238934}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2827873152790976, "2": 0.2506355718163646, "4": 0.21457181388055768, "1": 0.13413331306105564, "5": 0.117861508567254}, "score": 2.9313919142425293}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2792539489113377, "2": 0.25052318696659137, "4": 0.2069089370793331, "1": 0.1406179135256073, "5": 0.12268350130478596}, "score": 2.920515931149551}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28614580224663877, "2": 0.2628176324667733, "4": 0.18964122146535403, "1": 0.16001314673981493, "5": 0.10136388651787338}, "score": 2.8095215807874987}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2867503220125902, "2": 0.24803063803101658, "4": 0.20656569119551993, "1": 0.1434828877531744, "5": 0.11514846307044019}, "score": 2.9018640450104543}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29679850641382705, "2": 0.2841561693155352, "1": 0.17120727876972197, "4": 0.1675212617419238, "5": 0.08029668030838429}, "score": 2.7015378953855347}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29694275585065616, "2": 0.23769084982334143, "4": 0.22924217533713234, "5": 0.12296362488371096, "1": 0.11314768122978759}, "score": 3.0111833572309363}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2917505274306406, "2": 0.2595986745252955, "4": 0.19447901767899672, "1": 0.15517082067872637, "5": 0.09898271896433623}, "score": 2.8225009020132186}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28330653641427145, "2": 0.26568589866989806, "4": 0.19708318115433426, "1": 0.14584677422286005, "5": 0.10806253409789836}, "score": 2.8558266287573986}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2856662807462487, "2": 0.2666936386925706, "4": 0.203131058475908, "1": 0.14012762002426657, "5": 0.10436344588984138}, "score": 2.8649066457550947}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29616018662734106, "2": 0.25814805553284326, "4": 0.21181525985327887, "1": 0.12434578569232867, "5": 0.10952129212479511}, "score": 2.9240175014173597}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2880413594372157, "2": 0.23349047383171492, "4": 0.2327621179379539, "5": 0.1317826505832201, "1": 0.11391337361652612}, "score": 3.0350105490061443}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2884355254458284, "2": 0.25840845164605514, "4": 0.20623584220046062, "1": 0.13781126153161757, "5": 0.10909901659264565}, "score": 2.8904018153712987}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3288910625228207, "3": 0.29089933485237784, "1": 0.19698744169839583, "4": 0.12797527471635564, "5": 0.055223190288507265}, "score": 2.5155442297478343}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.33094340503218517, "3": 0.2921908191225041, "1": 0.18199482980021028, "4": 0.1339008203120756, "5": 0.060956224718031714}, "score": 2.5608741008198246}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32576770922117587, "2": 0.30705303311835697, "4": 0.1625923062538345, "1": 0.13980982118066423, "5": 0.06476536559945158}, "score": 2.7054468966658023}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3263326235981791, "2": 0.32391537032817175, "4": 0.15913405798768654, "1": 0.1295548416297041, "5": 0.06105477908491927}, "score": 2.6982160495029253}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30726150074742203, "2": 0.28860474249955276, "4": 0.1824145016212052, "1": 0.13921663972105114, "5": 0.08249224418000882}, "score": 2.7803586900888586}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3053949567263905, "4": 0.27100446018246316, "2": 0.21251391721197238, "5": 0.13594457677767477, "1": 0.07513202347356682}, "score": 3.1801174625740685}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30374726150178605, "4": 0.26789807177835795, "2": 0.2161636109332967, "5": 0.1359979046976085, "1": 0.07618627123814943}, "score": 3.1713589066876913}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30818919965806885, "4": 0.2853422619834547, "2": 0.20150108761840826, "5": 0.13826992859484774, "1": 0.06669038429142322}, "score": 3.22700188327815}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31123544355239857, "4": 0.27177210857182427, "2": 0.22372042708831957, "5": 0.12599849708482644, "1": 0.06726613927995508}, "score": 3.1655176193453087}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3022723036953958, "4": 0.27285744490928715, "2": 0.20942223538673155, "5": 0.14028602567587284, "1": 0.07515605453703589}, "score": 3.1936963015418987}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29748585540020694, "4": 0.24429946271610625, "2": 0.23606839656303313, "5": 0.1181359735151716, "1": 0.1039948396314697}, "score": 3.036513898869874}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30610380577437735, "4": 0.25247076983436434, "2": 0.23603032180147956, "5": 0.11879923636242108, "1": 0.08658791697466221}, "score": 3.080863729614623}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3098167454521546, "4": 0.25637675940244375, "2": 0.230542096957406, "5": 0.12002140225235237, "1": 0.08323301458061719}, "score": 3.099412430059267}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30731247965897984, "4": 0.2774129746069459, "2": 0.21338133687658015, "5": 0.13612559864217816, "1": 0.06575927192471236}, "score": 3.2047659985636994}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2881802864733528, "4": 0.2872063017564129, "2": 0.1944243378675672, "5": 0.1635728209053874, "1": 0.06660811913048065}, "score": 3.2867136995297006}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3134874661785818, "2": 0.2772866972288339, "4": 0.19680657212056735, "1": 0.12601554583480395, "5": 0.08638722265895918}, "score": 2.8402605934822676}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3163342409077228, "4": 0.23753697106031718, "2": 0.23596190652846227, "5": 0.11693778941456988, "1": 0.09321333389321572}, "score": 3.0490247481161386}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32020095369135143, "2": 0.24744016098583346, "4": 0.22847707543608553, "5": 0.10799906600469376, "1": 0.09586472460055309}, "score": 3.005305692863306}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3156528011437167, "2": 0.2399569612131322, "4": 0.23592606663696927, "5": 0.11564960566940956, "1": 0.09280043051782896}, "score": 3.0416680446972664}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3108442487894357, "2": 0.251032190266432, "4": 0.2196074597952503, "5": 0.11180824200538467, "1": 0.10669224539776466}, "score": 2.9788069318408805}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2752109732471617, "2": 0.2548763890948414, "4": 0.21356082335016555, "1": 0.13549814890139694, "5": 0.12084622613490091}, "score": 2.929380063361448}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29144461244807496, "4": 0.24082243530891373, "2": 0.24063370451177105, "5": 0.12524026081556885, "1": 0.10185224442283376}, "score": 3.0469650802443304}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.294299330098242, "4": 0.24555134721300548, "2": 0.23648743533713695, "5": 0.12315322095840087, "1": 0.10050112073029104}, "score": 3.0543685225786334}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28966578097883366, "4": 0.25712891630301776, "2": 0.225376892585191, "5": 0.13654190706640604, "1": 0.09127908477912505}, "score": 3.1222785753900077}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29370600351772824, "2": 0.24115584373025845, "4": 0.2410551339690302, "5": 0.12527812666954885, "1": 0.09879325952369723}, "score": 3.052869639541301}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26913125004254235, "2": 0.25790834735094353, "4": 0.19995328794271036, "1": 0.14831688192582776, "5": 0.12466969239276983}, "score": 2.8947483996214456}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2801773733848179, "4": 0.26002525969826273, "2": 0.20832017081453985, "5": 0.1607466268355952, "1": 0.090719087270916}, "score": 3.1917623698278184}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2801321003794363, "4": 0.2509996335027062, "2": 0.2199793061518738, "5": 0.15062210422262953, "1": 0.0982550136517871}, "score": 3.1357561161288747}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26844455108768567, "4": 0.2639512109294952, "2": 0.19897651028372904, "5": 0.17741680219116882, "1": 0.09119961531026019}, "score": 3.237411759581511}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2651013694272024, "3": 0.2635048249928648, "2": 0.20074934277674547, "5": 0.1756747333086658, "1": 0.09495976532381156}, "score": 3.225784212372601}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3263885291647765, "2": 0.30284444140739913, "4": 0.18111490769574887, "1": 0.12584287173077593, "5": 0.06379632450055914}, "score": 2.7541741944062834}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3391688883287206, "2": 0.24699240297831132, "4": 0.23605926089286247, "5": 0.10310147309911963, "1": 0.07466797452416282}, "score": 3.045934314415731}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3548782166686502, "4": 0.2554956231534448, "2": 0.23683854848753608, "5": 0.08522844835492148, "1": 0.06754920389929522}, "score": 3.054016101547076}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3391712625192485, "4": 0.26960442146115415, "2": 0.2262179192106149, "5": 0.10601628124647196, "1": 0.05898298302402697}, "score": 3.1374540790919383}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.33951936291050694, "4": 0.24704869896163373, "2": 0.24138705414207984, "5": 0.09456008749871093, "1": 0.07747340211849046}, "score": 3.039835469480016}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "human", "scores": {"2": 0.33386615495109206, "3": 0.2683774751758531, "1": 0.2104478920940182, "4": 0.131144462002501, "5": 0.05615067368038133}, "score": 2.488677048104145}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.29269100994077796, "3": 0.2915649164626582, "4": 0.18156655468738742, "1": 0.1489966286206072, "5": 0.085172096896661}, "score": 2.7612243816511266}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.3155276696170277, "3": 0.29139434258832775, "1": 0.1638607167691989, "4": 0.15967549172542592, "5": 0.0695333628908175}, "score": 2.6554902148163095}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30314855896910703, "2": 0.29008850874426945, "4": 0.1843619378420798, "1": 0.13787753711753606, "5": 0.08451255295261996}, "score": 2.7875411440370703}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2920614072564775, "3": 0.2758297090172098, "4": 0.17264439848685098, "1": 0.1685637268161933, "5": 0.09088806359567679}, "score": 2.7252281766084154}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "human", "scores": {"2": 0.262084790425213, "3": 0.2567044900059319, "4": 0.18570243465873956, "1": 0.18103251915756108, "5": 0.11446338371666964}, "score": 2.7904767790277027}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.26301410948801107, "3": 0.25738882491788795, "4": 0.18363305112062392, "1": 0.17899505486061704, "5": 0.11695561209173012}, "score": 2.7965373403726907}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2605028701497717, "3": 0.25772880250262076, "4": 0.18709140214841724, "1": 0.17570080537358818, "5": 0.11896495797904078}, "score": 2.813114751225079}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26663043978956635, "2": 0.23539392302875456, "4": 0.22266167767852008, "5": 0.1454169711889146, "1": 0.12988779715740037}, "score": 3.018326271152426}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2589790781212677, "2": 0.2553913000451777, "4": 0.1881586291223899, "1": 0.17269963626473842, "5": 0.1247580022643733}, "score": 2.8368818827674485}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30938912194810986, "2": 0.29615396732872473, "4": 0.18857214749326826, "1": 0.12400095646244919, "5": 0.08187619415777118}, "score": 2.8081671952069223}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3270416650979358, "2": 0.2818291620368583, "4": 0.21058365371125787, "1": 0.09805105172325615, "5": 0.08248587602457211}, "score": 2.897623260716887}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3400309962792664, "2": 0.27475532627226373, "4": 0.2149405286604389, "1": 0.09007397516382443, "5": 0.08019202563807086}, "score": 2.9204207345051816}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3207391830446593, "2": 0.25257445561769293, "4": 0.23176033037899219, "5": 0.10345449756485064, "1": 0.09146508172756976}, "score": 3.0031647268536226}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31864973144885056, "2": 0.26469342751418046, "4": 0.21789830845574326, "1": 0.1021110839457473, "5": 0.09663848709289237}, "score": 2.942259169788944}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28114034104510116, "2": 0.2735147850219619, "4": 0.1890978638094478, "1": 0.15056022631369145, "5": 0.10567364023878037}, "score": 2.8258076171277082}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29144414613706815, "2": 0.26723306465743335, "4": 0.20969283699561386, "1": 0.1226157251302467, "5": 0.10900447963812496}, "score": 2.915236455126241}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28531849396298326, "2": 0.2716060250504546, "4": 0.19668219032690037, "1": 0.14145858362105837, "5": 0.10492517519997477}, "score": 2.8520079377978234}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28373365936095807, "2": 0.25449443745214245, "4": 0.21388437793348114, "5": 0.12449094458246877, "1": 0.12338463364766378}, "score": 2.9616021036103866}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27615996439940865, "4": 0.23146319568894877, "2": 0.22922997997780384, "5": 0.1467164157437237, "1": 0.11641696580120982}, "score": 3.062832962483277}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.282938052799855, "4": 0.2425568895586066, "2": 0.2202531967682272, "5": 0.14955957059489583, "1": 0.10468117256076481}, "score": 3.1120617347293673}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29909539788726447, "4": 0.25594745742543246, "2": 0.22624452400224515, "5": 0.13058414117840886, "1": 0.08811698256273257}, "score": 3.1146385686477345}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28196920954947996, "4": 0.25131247344246355, "2": 0.21289716995671734, "5": 0.1555442378562954, "1": 0.09826606796261628}, "score": 3.152973301692223}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29043214790683647, "4": 0.2606825488158417, "2": 0.21142790781437698, "5": 0.14840812486253932, "1": 0.08904040709313267}, "score": 3.167991565534741}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29320023718999455, "4": 0.26151987357241846, "2": 0.2160525529924201, "5": 0.1448945996277195, "1": 0.08432416502088672}, "score": 3.1666096179040917}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2940152330177963, "2": 0.2705156571812799, "4": 0.20119282548813802, "1": 0.13738200166816394, "5": 0.09687995928495821}, "score": 2.8496709303231142}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2974074484632117, "2": 0.24465236363549744, "4": 0.22720663254991266, "1": 0.11830727661992214, "5": 0.11241259417265616}, "score": 2.970764503945018}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2808784122241039, "2": 0.26911892411355626, "4": 0.1901076667902198, "1": 0.16068169831479798, "5": 0.0991983696307758}, "score": 2.798019069950151}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2854967881105407, "2": 0.2582122907595907, "4": 0.220175527163567, "1": 0.12010300853021505, "5": 0.11600332784132371}, "score": 2.9537634562343174}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.300429848954142, "2": 0.2480618918603584, "4": 0.2274143716033016, "1": 0.11279839147423941, "5": 0.11128030394692925}, "score": 2.976315944876344}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2540856662817903, "2": 0.25059484684493794, "4": 0.1899786085004047, "1": 0.17832615034583646, "5": 0.12699747177565568}, "score": 2.8367235869762784}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2596252068656115, "2": 0.2530813754184875, "4": 0.19080387708927607, "1": 0.1741352992554388, "5": 0.1223422541557852}, "score": 2.834134423205085}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.25949950082010237, "2": 0.25432556010115553, "4": 0.19005026294326632, "1": 0.17070082775733036, "5": 0.12541111730099935}, "score": 2.8451433104369874}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.26685343603667405, "3": 0.2637893001457773, "4": 0.1899158879196157, "1": 0.16856129951600377, "5": 0.11086677763221758}, "score": 2.8076708503781465}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.24888045455304406, "2": 0.2446782002892487, "4": 0.1959067104797285, "1": 0.17515236967969305, "5": 0.1353650738107855}, "score": 2.87165171199318}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2947981482688342, "2": 0.2818886342641475, "4": 0.19946470013249526, "1": 0.13544733307684775, "5": 0.08838944649553433}, "score": 2.8234582205003047}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3103413991172927, "2": 0.25399718365436846, "4": 0.2371278575458478, "5": 0.10809600624760331, "1": 0.09042498201844576}, "score": 3.0184729545809996}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31740760845162186, "4": 0.2465804178404539, "2": 0.23993711759298483, "5": 0.11321640536436609, "1": 0.08284416218951021}, "score": 3.0673887494854433}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3140518435045835, "4": 0.25073569565714804, "2": 0.23658493555139656, "5": 0.11469799905838277, "1": 0.08390700304845557}, "score": 3.0757344579064356}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3125707923315512, "4": 0.2510101757086981, "2": 0.23389181490440758, "5": 0.12053620677765427, "1": 0.08197246342545633}, "score": 3.094247595504913}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2827329970532651, "2": 0.23850547808682918, "4": 0.22319400682007917, "1": 0.1319015325891485, "5": 0.12365692274085216}, "score": 2.9681990208336115}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.293355439818509, "4": 0.24204282637277114, "2": 0.23202032578760273, "5": 0.12793670878073457, "1": 0.10463961191955236}, "score": 3.0566169823362856}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2871089266103763, "2": 0.23656203523802827, "4": 0.23581558474423575, "5": 0.130889633924547, "1": 0.10961779001337738}, "score": 3.0417974893452313}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2883373010344284, "4": 0.2663974266725853, "2": 0.20553741366230432, "5": 0.1594221760950396, "1": 0.08029886440779227}, "score": 3.219108130292021}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29344102408216205, "2": 0.24377000516503575, "4": 0.22775666015466176, "5": 0.12110770564718275, "1": 0.1139180441605899}, "score": 2.9983659672422647}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2874820946966986, "2": 0.24228513563194543, "4": 0.23055422379063883, "5": 0.13004059604574408, "1": 0.10962719562325546}, "score": 3.0290962019103858}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2713609026475979, "2": 0.2370362253379712, "4": 0.22854759434207264, "1": 0.135819171404977, "5": 0.1272233596359587}, "score": 2.9743194181251535}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2887081103647535, "2": 0.24082424148395168, "4": 0.23230405116282565, "5": 0.1268193051183778, "1": 0.11133555720253194}, "score": 3.02244750158203}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2826055697424673, "4": 0.23413994191704038, "2": 0.23304078449108684, "5": 0.1393196702974279, "1": 0.11088439576290672}, "score": 3.0579702652001837}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29049244787966255, "2": 0.25985047748200796, "4": 0.21295406368119285, "1": 0.1285031321802946, "5": 0.10819046935981855}, "score": 2.912477437021939}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2731720670792761, "2": 0.22319481031995, "4": 0.2137410592735673, "5": 0.16119196420452725, "1": 0.12865125308982917}, "score": 3.0556303885067986}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28877911241843696, "2": 0.23281279576711053, "4": 0.2259599969552061, "5": 0.14485842396291218, "1": 0.10757289157836004}, "score": 3.067719402242583}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28260537191863777, "4": 0.24541895707366332, "2": 0.22024740418532504, "5": 0.16126650047731095, "1": 0.09045006034290846}, "score": 3.1668063857930546}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2706242639619952, "4": 0.23604582950304434, "2": 0.2174821501711057, "5": 0.1678550449009035, "1": 0.10797117344842347}, "score": 3.1383344016852517}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2734918380941357, "2": 0.22248219567850863, "4": 0.21621000462206774, "5": 0.15933752945721988, "1": 0.128436584795086}, "score": 3.0555320221359588}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2657917955990798, "2": 0.22719811246094468, "4": 0.22364587349501755, "5": 0.149595888067399, "1": 0.13375076146847292}, "score": 3.028138508594824}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2748559326120788, "4": 0.2405681648175737, "2": 0.21840112151120647, "5": 0.1543638192706399, "1": 0.11179331660136983}, "score": 3.107309942148918}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.289060202330925, "4": 0.23704900193484313, "2": 0.2323013796815983, "5": 0.13274234304950974, "1": 0.10882991808087839}, "score": 3.052573374082652}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2725141607974123, "4": 0.23334682799847525, "2": 0.22971159308778827, "5": 0.14057209361434939, "1": 0.12384238631337778}, "score": 3.0370951294564117}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2586098819786437, "4": 0.2406806085914345, "2": 0.20672243070823726, "5": 0.17502157971567575, "1": 0.11895253868572614}, "score": 3.146098153421957}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2669198107395686, "2": 0.25469034628801956, "4": 0.19007075146592312, "1": 0.1665013602375691, "5": 0.12180593469201119}, "score": 2.8459877372692857}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2793746406162273, "2": 0.25582688339296655, "4": 0.20385096823208432, "1": 0.14260627040273377, "5": 0.11832920098950993}, "score": 2.899468735981534}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.284501031432651, "2": 0.27732967999798297, "4": 0.18985138444902414, "1": 0.1474418674309228, "5": 0.1008652713167071}, "score": 2.8193665676363864}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.284498015737701, "2": 0.2580309345220097, "4": 0.2053465991404762, "1": 0.1377459544726473, "5": 0.11436783524674433}, "score": 2.9005583660312917}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29261298891819215, "2": 0.26975444412574817, "4": 0.19582893136906152, "1": 0.13764443181134275, "5": 0.10414590815968965}, "score": 2.859075566262856}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29207776315324474, "2": 0.2846416096621425, "4": 0.18170596050825055, "1": 0.14844500886421508, "5": 0.0931066563944333}, "score": 2.7863827324065418}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29219528967623626, "2": 0.27228531778989085, "4": 0.19999818249507842, "1": 0.13240344714232374, "5": 0.10310803056133384}, "score": 2.86912075778256}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29028473292980256, "2": 0.27024243917634405, "4": 0.19565033853851915, "1": 0.13769291871826983, "5": 0.10611931549770853}, "score": 2.862259280370778}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30782057945024927, "2": 0.26590967381291714, "4": 0.20437488500447767, "1": 0.12375765758166417, "5": 0.0981263838548154}, "score": 2.887201443224104}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2956640013444041, "2": 0.2759189267708392, "4": 0.1972020187099749, "1": 0.13516284070595985, "5": 0.09604115321962098}, "score": 2.8430379810843753}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2904565742775899, "4": 0.2522620880461644, "2": 0.2238715341286857, "5": 0.141800165180663, "1": 0.09159761909981114}, "score": 3.1287971941270585}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2725300760891249, "4": 0.27016537702227644, "2": 0.1949093110765392, "5": 0.18648533046798776, "1": 0.07589713821261675}, "score": 3.2964362350968606}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2970868377257526, "4": 0.2848627481931836, "2": 0.1939296722147464, "5": 0.1657187176259726, "1": 0.05839095390692771}, "score": 3.3055919864217063}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2953964873854714, "4": 0.29025434170927294, "2": 0.19285422236735833, "5": 0.16355497608407935, "1": 0.057928313906635824}, "score": 3.3086570421894907}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28207313435016745, "4": 0.2722431168362918, "2": 0.20113768609187122, "5": 0.17116140136685826, "1": 0.07337408287941731}, "score": 3.26668288881768}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2852100935326636, "3": 0.27096944866800016, "1": 0.19155733800643668, "4": 0.16380955105729364, "5": 0.08844383156848823}, "score": 2.6723692544534106}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27370431434945064, "2": 0.27336051150490404, "1": 0.18349895616092743, "4": 0.16743882806548638, "5": 0.10198540134599134}, "score": 2.731047982579751}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28458943963662037, "2": 0.258021851992968, "4": 0.18949248731902793, "1": 0.15402309812359558, "5": 0.11386297809953125}, "score": 2.8511488852089357}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28082726892197696, "2": 0.27069089985832484, "4": 0.18926812849449173, "1": 0.15270730942881588, "5": 0.10649754987136215}, "score": 2.8261561721464012}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27678271582970926, "2": 0.27174678059160756, "4": 0.17885746057521262, "1": 0.17621858399755408, "5": 0.09638151970964898}, "score": 2.7474332833722217}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2689138260391326, "2": 0.2460623302853834, "4": 0.2078294474121792, "1": 0.1478985963270111, "5": 0.1292849236203405}, "score": 2.9245389509752435}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2672858216713427, "4": 0.23833548429094314, "2": 0.2183704819832716, "5": 0.15636028739891655, "1": 0.11963091311526798}, "score": 3.093425340183904}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2819481472362138, "4": 0.2360118413508016, "2": 0.2314849311034857, "5": 0.1385995276833747, "1": 0.11194262676100734}, "score": 3.0578414597429573}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2806811082946885, "4": 0.24828343558254995, "2": 0.22053406637428835, "5": 0.1601024750017433, "1": 0.09038572801391445}, "score": 3.167185067808739}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2710846080506174, "2": 0.23534501325345086, "4": 0.22736577834446461, "5": 0.13979813356816254, "1": 0.12639493111648836}, "score": 3.0188273871808278}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.33978140316802424, "2": 0.2517106916479183, "4": 0.2348646237449499, "5": 0.09302493532434015, "1": 0.08060624105686383}, "score": 3.007991417368554}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.34261161197014117, "4": 0.28027861975887797, "2": 0.2108238138009929, "5": 0.11540518445085374, "1": 0.050871852726639556}, "score": 3.198523239696109}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3559708263297527, "2": 0.2562079396379189, "4": 0.23258114595175078, "5": 0.08201715879588606, "1": 0.07321170254203622}, "score": 2.9939840512820233}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.32009216789104133, "3": 0.3194231072542876, "2": 0.16584101342722543, "5": 0.15590795155775414, "1": 0.03872869813057159}, "score": 3.3886124055976086}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.34364033718395376, "4": 0.2613305755755755, "2": 0.23280713848490964, "5": 0.09909252196289657, "1": 0.06312041674767377}, "score": 3.1004685527472917}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2520994818816535, "3": 0.24720928337444426, "1": 0.20175211270318383, "4": 0.18158876163495283, "5": 0.117330199642633}, "score": 2.7606406279645945}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.24934821640333693, "2": 0.24511842938145162, "1": 0.19201987436378595, "4": 0.18394764498257268, "5": 0.12955050161520518}, "score": 2.813887616395575}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.25301755634353057, "3": 0.24819995190173127, "1": 0.1978445218370091, "4": 0.18247125960090554, "5": 0.11845243398030333}, "score": 2.7706662534982227}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.25387394872651486, "2": 0.24990700757944329, "4": 0.19159061440602004, "1": 0.18016854591767303, "5": 0.1244444683414159}, "score": 2.830232834708298}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2514341632635017, "2": 0.24514215799386202, "4": 0.18891736155305575, "1": 0.18573216799861877, "5": 0.12875918528031252}, "score": 2.8298266916644006}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28401915383901244, "4": 0.24510239916036403, "2": 0.2198932670776474, "5": 0.1494881281010365, "1": 0.10148573827282878}, "score": 3.1212152831141906}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29715458124722205, "4": 0.24292218822174072, "2": 0.22771555378746508, "5": 0.13568629663952442, "1": 0.09651042938003421}, "score": 3.0935593934963532}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3074044105692281, "4": 0.2470794337314476, "2": 0.2272545327565586, "5": 0.1304746531264969, "1": 0.08777532976494314}, "score": 3.1052247725197493}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2907461875898579, "4": 0.2880074589642919, "2": 0.18962821252377332, "5": 0.17213233645661824, "1": 0.05947758857445113}, "score": 3.323691401618128}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2984085972225605, "4": 0.26973219030209067, "2": 0.2051364523606195, "5": 0.15220478426219555, "1": 0.07450723829455592}, "score": 3.219993192066405}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2806557920005024, "2": 0.27612550178636336, "4": 0.18660757435387818, "1": 0.16313434747796426, "5": 0.09346725667590994}, "score": 2.7711457105071604}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2806548939034049, "2": 0.26167146825947185, "4": 0.2008510279884502, "1": 0.14587202248465203, "5": 0.11094312459755004}, "score": 2.869320788726338}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29201725091000424, "2": 0.28275980141189233, "4": 0.1879333876404806, "1": 0.1476933225519441, "5": 0.08958652150039707}, "score": 2.788957933643884}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2839728056952174, "2": 0.2612166080366367, "4": 0.20583804679528717, "1": 0.14135214780731045, "5": 0.10760973084295866}, "score": 2.8771352949911244}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2834724609610131, "2": 0.2801891691005355, "4": 0.19409060361491912, "1": 0.15057177472592564, "5": 0.09166670974851371}, "score": 2.796089411892252}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "human", "scores": {"2": 0.320187729665042, "3": 0.30104910138867047, "4": 0.16854759603940694, "1": 0.14956661501656568, "5": 0.06063623665575818}, "score": 2.670494917941314}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.292095901745534, "4": 0.240870339655226, "2": 0.23875713864130557, "5": 0.1237637837373356, "1": 0.10450380466108368}, "score": 3.040633526150535}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3115735976881114, "2": 0.2817249890532159, "4": 0.20816251130275523, "1": 0.11874392443842827, "5": 0.07978555547465761}, "score": 2.848519357064892}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3087148634830478, "2": 0.25785091755703343, "4": 0.23330503932386817, "1": 0.1005073921958923, "5": 0.0996109879194535}, "score": 2.973661028765692}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.296246766902983, "2": 0.27763057942115377, "4": 0.2068684075885525, "1": 0.12305409789718515, "5": 0.0961888050215089}, "score": 2.8755058302576866}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30160670851766613, "4": 0.27347810914846277, "2": 0.19951227813692837, "5": 0.15745587794417237, "1": 0.06793219524633284}, "score": 3.253016948903211}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31499317722318915, "4": 0.2550702708055936, "2": 0.2256735032827585, "5": 0.1298732505387446, "1": 0.07437678614572521}, "score": 3.1403915230839323}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3075942914124314, "4": 0.25384338414311297, "2": 0.22107360027256495, "5": 0.13788753360134526, "1": 0.07958868853986796}, "score": 3.1493693414135913}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3075808190775138, "4": 0.24687486257132985, "2": 0.2293795554724873, "5": 0.1286761495159536, "1": 0.08747395386897099}, "score": 3.09990116289328}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3024562318738176, "4": 0.27617225379126137, "2": 0.19802941474564612, "5": 0.15869466006492014, "1": 0.06463217029292362}, "score": 3.2662718843566347}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2868837206067967, "2": 0.24596053075688634, "4": 0.2135642403506751, "1": 0.13588698926127094, "5": 0.11768814405422819}, "score": 2.931204892661875}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2959103624739741, "2": 0.2536352164328325, "4": 0.21238833735429177, "1": 0.12509647992433495, "5": 0.11295813676696154}, "score": 2.934475683236253}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3097674265521672, "2": 0.25652080668009075, "4": 0.21724387685955035, "5": 0.11356150438213829, "1": 0.10289743125108858}, "score": 2.9820510557217768}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2946947806848016, "4": 0.2473233967883665, "2": 0.22617928448951286, "5": 0.1360270249662178, "1": 0.09576631249010671}, "score": 3.101666472641692}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29752173435782586, "2": 0.25358114716867736, "4": 0.21224264646945862, "1": 0.12474270787086116, "5": 0.1119012156506336}, "score": 2.9329778078779025}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2832903884019186, "2": 0.25930175972921965, "4": 0.2114664546354075, "1": 0.1392035678923133, "5": 0.10672781184997573}, "score": 2.8872120529692498}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28920797876138626, "2": 0.25153151226878534, "4": 0.22334283754479484, "1": 0.1182600104765892, "5": 0.11764648982446668}, "score": 2.970583955361483}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29545634077675953, "2": 0.24223697413439327, "4": 0.23348592081186734, "5": 0.11888865454276128, "1": 0.10992090689959132}, "score": 3.0091845448567507}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2696502311437827, "4": 0.2516333025094264, "2": 0.2064311987630591, "5": 0.17069411934662063, "1": 0.10158278471257544}, "score": 3.183426307104878}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27997499034460865, "2": 0.23625820099604547, "4": 0.235402679845567, "5": 0.13187700118557813, "1": 0.11647876468184307}, "score": 3.02994120225366}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2841048269346637, "2": 0.2645946888172242, "4": 0.19119972818354988, "1": 0.15364354536140645, "5": 0.10644121692192116}, "score": 2.8321976986940576}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27950195270198297, "2": 0.24554056774547384, "4": 0.2118945995235199, "1": 0.13613292239639235, "5": 0.1269176789421692}, "score": 2.947922905431076}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27906663236334817, "2": 0.2610874683563801, "4": 0.1982951701562209, "1": 0.14999684776600458, "5": 0.11154348099694937}, "score": 2.8602995153262443}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28708977708361527, "2": 0.23752552205423536, "4": 0.23300557468871783, "5": 0.12658100753460527, "1": 0.11578675484059335}, "score": 3.01706875198836}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28713792607641236, "2": 0.2814595883407654, "4": 0.19061953516848468, "1": 0.15069268721123188, "5": 0.09007629009473289}, "score": 2.7879241892364344}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2768013716134491, "2": 0.25168657891867663, "4": 0.21004426179946523, "1": 0.13933188916830264, "5": 0.12211808408844928}, "score": 2.9239287175559414}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28397328844939734, "2": 0.23326680376141293, "4": 0.23037070653932523, "5": 0.13558587168739747, "1": 0.11678649970335384}, "score": 3.0347032307964845}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2840255443418667, "2": 0.2401567605269005, "4": 0.23105433030247577, "5": 0.13538598933037155, "1": 0.10935987823497396}, "score": 3.0429505434833435}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27602492758676533, "4": 0.24266599192166882, "2": 0.22508353027627667, "5": 0.15022450557460693, "1": 0.10598441754168401}, "score": 3.106064401254538}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2762939897260501, "2": 0.23292883529208785, "4": 0.23136007866512887, "5": 0.14322437821686623, "1": 0.1161781720867941}, "score": 3.052524419654081}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29559819386234937, "2": 0.2538639462899843, "4": 0.21158639011368072, "1": 0.12801335302445124, "5": 0.11092228034281719}, "score": 2.9235390875973795}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29887934962039076, "2": 0.28345298707188077, "4": 0.17603252497909583, "1": 0.15798757314963432, "5": 0.08362983036413524}, "score": 2.7438595097320433}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29135958131680806, "2": 0.26800581525339395, "1": 0.17264427763581433, "4": 0.17181708969835174, "5": 0.09614527020432503}, "score": 2.7508062906577893}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29299196310999204, "2": 0.26484111469417304, "4": 0.2016788899770014, "1": 0.13841913315693494, "5": 0.10205646912660311}, "score": 2.864110758127681}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29796391214336587, "2": 0.2710721655526654, "4": 0.19352193766360487, "1": 0.1379253475471138, "5": 0.09949996366435683}, "score": 2.845596429908479}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29015558496120303, "2": 0.2602689654955206, "4": 0.204961094660201, "1": 0.13755031521153036, "5": 0.10705463150565485}, "score": 2.8836996675801094}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29465700323550403, "2": 0.25191430722386793, "4": 0.2176422324242401, "1": 0.12461387780233585, "5": 0.11116457700805328}, "score": 2.938828834101419}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29835796158016764, "2": 0.24997064200389146, "4": 0.2213565564407123, "1": 0.11637605242867717, "5": 0.11392679340234801}, "score": 2.966486994424341}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28882913329239046, "2": 0.24706796951169444, "4": 0.2288010111784563, "5": 0.11922726706082731, "1": 0.11606664813269689}, "score": 2.9880541843050294}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2896238983350922, "2": 0.2648548603047212, "4": 0.20330106902492573, "1": 0.1383138915926963, "5": 0.10388913064169693}, "score": 2.869594450349876}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2769132496511531, "2": 0.24996901719999906, "4": 0.2149740190036342, "1": 0.13272311007746435, "5": 0.12540159895842187}, "score": 2.950361036171616}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2948286909390778, "2": 0.24527152912152209, "4": 0.2355511715900039, "5": 0.12106024073030054, "1": 0.10327869170307696}, "score": 3.0258429905775355}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28520076731508953, "2": 0.24806288410991037, "4": 0.22274247399074665, "5": 0.12395545646118843, "1": 0.12002632323072408}, "score": 2.982537645136463}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2811885888671693, "4": 0.23974114504968566, "2": 0.23598019428485964, "5": 0.13657668871939133, "1": 0.10650244887133234}, "score": 3.063910129267563}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28875439398437797, "2": 0.24593782964756977, "4": 0.2241370463828402, "1": 0.12193767810189712, "5": 0.11921890952234152}, "score": 2.972761294356552}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.30849803660016817, "3": 0.3070720709965784, "4": 0.17564885832618865, "1": 0.14318989393866532, "5": 0.06557838069014676}, "score": 2.7119241195396944}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3185402940630449, "2": 0.261208249238921, "4": 0.22937033459969808, "1": 0.0977505943332105, "5": 0.09312139634477681}, "score": 2.9589033141127956}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31123021484086816, "2": 0.29904069834141683, "4": 0.19191935907476815, "1": 0.12383825004675095, "5": 0.07396144759354568}, "score": 2.7931229808292026}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31216343443671896, "2": 0.27748771973002107, "4": 0.20779738180236895, "1": 0.11336364839157224, "5": 0.08917961472386293}, "score": 2.881940626541989}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31620428586922494, "2": 0.255014799054465, "4": 0.22554607887614417, "1": 0.10162690153476663, "5": 0.10159995365392652}, "score": 2.9704771484377814}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2745574912695796, "3": 0.2594282260972585, "1": 0.19164279163393, "4": 0.16640277068207948, "5": 0.10795617729393851}, "score": 2.724468594735705}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2871607257328772, "3": 0.25826884544377887, "1": 0.2070907036098983, "4": 0.1499511356936792, "5": 0.0975108914536694}, "score": 2.6436244784908087}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.29901644712418146, "3": 0.25630731634480847, "1": 0.21542647735876058, "4": 0.1420312464734045, "5": 0.0872023324626544}, "score": 2.5865598199972477}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2832531381651005, "3": 0.26458606317096756, "1": 0.18424989827794142, "4": 0.16297162061339304, "5": 0.1049269799285088}, "score": 2.7210692149442597}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.29256901249086903, "3": 0.2516072598103496, "1": 0.2225055797860878, "4": 0.14421277007114472, "5": 0.089094667035034}, "score": 2.584817485138583}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3017722153523328, "4": 0.27352017331630135, "2": 0.1995330683994641, "5": 0.15723697762914127, "1": 0.06792267182016708}, "score": 3.2526194789185983}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3026190878922001, "4": 0.27181032241665976, "2": 0.20572258346349737, "5": 0.1540494229204547, "1": 0.06578812684616998}, "score": 3.2426128679737283}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3019640525450008, "4": 0.25972406499831685, "2": 0.21068951965749694, "5": 0.15089414718664423, "1": 0.07671530092169603}, "score": 3.197394787163367}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29989693900445086, "4": 0.2499398725117619, "2": 0.22510522937447505, "5": 0.1376933317976456, "1": 0.08735342789107983}, "score": 3.125515856655287}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30925119609148827, "4": 0.2696076836943903, "2": 0.2053607480085799, "5": 0.1517733939202327, "1": 0.06399409279247252}, "score": 3.2398086279936886}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28124280725358736, "2": 0.2516403483405379, "4": 0.20221065063891874, "1": 0.14935409737189878, "5": 0.11553478794975892}, "score": 2.882929657148476}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28535404686223076, "2": 0.2631724390156774, "4": 0.2003103430200014, "1": 0.14395046955471874, "5": 0.10719960661375247}, "score": 2.863634392423812}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29176832475562675, "2": 0.2577470245731003, "4": 0.2039409679109298, "1": 0.1366943045476309, "5": 0.10983588300182089}, "score": 2.892475649182419}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30108288099284664, "2": 0.24260569691464118, "4": 0.2324623041006769, "5": 0.12069050742434946, "1": 0.10314309325204435}, "score": 3.02495182271595}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27681878296730483, "2": 0.25161838109701185, "4": 0.2059753247776161, "1": 0.14709868366311474, "5": 0.11847630455062953}, "score": 2.8971108969811254}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3149897753152455, "2": 0.29766710922998124, "4": 0.17479732833538794, "1": 0.13839294673425534, "5": 0.07414382433321423}, "score": 2.7486297079357214}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3040774926582292, "2": 0.26199271000933416, "4": 0.21837474024918824, "1": 0.11026073497582889, "5": 0.10528480207824602}, "score": 2.9464296544534356}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3043931672082463, "2": 0.2731379773325491, "4": 0.19951437302684694, "1": 0.12371954609259962, "5": 0.09922486905414461}, "score": 2.8773858072252887}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30917982915149195, "4": 0.24451886880947724, "2": 0.2423006181467734, "5": 0.11832484655503558, "1": 0.08566475484401402}, "score": 3.0675391825872795}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29588941276193953, "2": 0.2618366612442539, "4": 0.21683725148151484, "1": 0.11712985357591993, "5": 0.10829662379744018}, "score": 2.9373334916612093}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "human", "scores": {"3": 0.301241322370887, "2": 0.2554978459750355, "4": 0.22077023034613366, "1": 0.11260043500577946, "5": 0.10987819993367104}, "score": 2.959827433507148}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3066626486258523, "2": 0.24623042363967854, "4": 0.23627955970281453, "5": 0.11188745264755062, "1": 0.09893280467033382}, "score": 3.0159585454942186}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30984924693342536, "2": 0.2582781432895751, "4": 0.21981326247547808, "5": 0.10774337896574801, "1": 0.10430723001111367}, "score": 2.9684071410265136}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2971026431659406, "2": 0.25586116649225754, "4": 0.21652369322469117, "1": 0.12138884389593697, "5": 0.10911527355723173}, "score": 2.9361148507189414}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2926114965957541, "2": 0.25137420336606536, "4": 0.21553484258037542, "1": 0.12448055002257503, "5": 0.11599124092430196}, "score": 2.947181616085046}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3006056818936753, "2": 0.2433227810490432, "4": 0.23611828308555238, "5": 0.11611796093046446, "1": 0.103825736066346}, "score": 3.017380117866097}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3177494499474464, "2": 0.2460154352744675, "4": 0.2369357432821291, "5": 0.10860048560406368, "1": 0.09069030667080863}, "score": 3.0267408952902244}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31420582945714287, "4": 0.24562964146193716, "2": 0.2341834725782924, "5": 0.11524776383808905, "1": 0.09072493884075608}, "score": 3.060492324220528}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3299683296119463, "4": 0.26994228556493205, "2": 0.2239839010550154, "5": 0.11583664652047489, "1": 0.060258821644092964}, "score": 3.157115607870319}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3156395124405177, "4": 0.2704606128459946, "2": 0.2105678605294813, "5": 0.1326979216216317, "1": 0.07062523938494016}, "score": 3.184039746126424}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "human", "scores": {"3": 0.289290356923831, "2": 0.2800274625742936, "4": 0.1765023479260674, "1": 0.16866595799201126, "5": 0.08549823897800654}, "score": 2.7301352278245696}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2890674289263153, "2": 0.2591682796205381, "4": 0.20072212301140674, "1": 0.1481514970577675, "5": 0.10287887022874544}, "score": 2.851006831441315}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29453512884472144, "2": 0.2614408280629682, "4": 0.19644309155993828, "1": 0.14630243898120135, "5": 0.10126537830853856}, "score": 2.844926105373487}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29796462725761313, "2": 0.2561414110751027, "4": 0.20929431748380917, "1": 0.13121755605884172, "5": 0.10537032805638145}, "score": 2.901457291534809}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28630717673713957, "2": 0.25499827463088337, "4": 0.20509745962740247, "1": 0.14597307384521793, "5": 0.10761142032899534}, "score": 2.87337428313465}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30479632875781787, "2": 0.2593234382624831, "4": 0.22862830874692439, "5": 0.10601140460969814, "1": 0.10123051864022319}, "score": 2.9788664310669306}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3144716028258077, "4": 0.2721805081196979, "2": 0.230002132123439, "5": 0.12013514038244053, "1": 0.06320192622816685}, "score": 3.1560461603959444}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31290535949325377, "4": 0.25878496838932497, "2": 0.23684070372813365, "5": 0.11642236767374546, "1": 0.07503542827355324}, "score": 3.10471931343203}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31281807107525567, "4": 0.25020124623662515, "2": 0.24494575527313442, "5": 0.11169498175643827, "1": 0.08033158482984944}, "score": 3.067982853209658}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3265893851648895, "4": 0.2587474990387486, "2": 0.2418628134830484, "5": 0.10390235656984008, "1": 0.06888726163401002}, "score": 3.086915804045325}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "human", "scores": {"2": 0.28270404667665144, "3": 0.2584691072273105, "1": 0.18228809570603338, "4": 0.17688872790486576, "5": 0.09963786658976374}, "score": 2.7288809273005934}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.27924392387452224, "3": 0.2580476812730864, "1": 0.19562420139929018, "4": 0.17217375647939864, "5": 0.09489965583308169}, "score": 2.6914774152470886}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.27732330148869616, "3": 0.26115794537453524, "1": 0.1858500524541025, "4": 0.17970754489750035, "5": 0.09595120480646675}, "score": 2.722583787550712}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.261638290420816, "3": 0.25940321842165204, "4": 0.19550033226362046, "1": 0.16758300470231746, "5": 0.11586414940482205}, "score": 2.8304224650832013}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2832772440328485, "3": 0.2749899025471643, "4": 0.18029292314263623, "1": 0.16407592515957048, "5": 0.09734796026277763}, "score": 2.763555955605793}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29254610523402186, "2": 0.2735028326870169, "4": 0.20692501452834494, "1": 0.12660100891386308, "5": 0.10041552020060181}, "score": 2.881050072197512}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29338574500067793, "2": 0.2465297754237837, "4": 0.23386113031124545, "5": 0.12273557923289444, "1": 0.10347621494304864}, "score": 3.0258503821706038}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31375875015022886, "2": 0.27776920720501685, "4": 0.2124480481078753, "1": 0.10475497785711686, "5": 0.0912609311745983}, "score": 2.9076900011648488}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30358258401820915, "2": 0.2493955970654739, "4": 0.2339050535557815, "5": 0.1157607173274578, "1": 0.09734820363298254}, "score": 3.021334651236798}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2852388726829847, "2": 0.24307199592425893, "4": 0.2367610912671448, "5": 0.12964925671835179, "1": 0.1052720949695246}, "score": 3.042443702722603}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "human", "scores": {"2": 0.24620336440305282, "1": 0.22461840373179262, "3": 0.2213584158435959, "4": 0.1694887883122152, "5": 0.13830712820876348}, "score": 2.7506569136878682}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.24758359411485992, "2": 0.2431545328767301, "3": 0.20509005574275085, "4": 0.15996027113299274, "5": 0.14419266821212892}, "score": 2.710018412201429}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2660148086855139, "1": 0.24418063993348033, "3": 0.21825344494246224, "4": 0.153303233607003, "5": 0.11823399613596673}, "score": 2.635390077745568}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.23638115812254634, "3": 0.23077990843011792, "1": 0.19235510691871374, "4": 0.18670456084442064, "5": 0.15376304966920448}, "score": 2.873137231014291}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.27526494741100926, "2": 0.27159814858993736, "3": 0.20826416105145795, "4": 0.13734788021700925, "5": 0.10751009810130717}, "score": 2.5302330970734985}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2775623739671732, "3": 0.2738937011155483, "4": 0.1843010162894641, "1": 0.17472282811516876, "5": 0.08950645798924989}, "score": 2.7363023098425}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.29829969795989875, "3": 0.27939034191223217, "1": 0.17823469249165438, "4": 0.1667014985106075, "5": 0.07736281810880642}, "score": 2.6666544013117606}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2747618930030338, "3": 0.2726252329473508, "4": 0.18408013497763479, "1": 0.17493967128637433, "5": 0.093581131720697}, "score": 2.7465981382221756}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2768031431478963, "2": 0.26852176684367196, "4": 0.19098914213731447, "1": 0.161140648852962, "5": 0.10253396186651642}, "score": 2.805251793430802}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28688395011386486, "2": 0.2660550331654812, "4": 0.20026734100578641, "1": 0.1444671547550572, "5": 0.10231366880940942}, "score": 2.8499034068850198}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28737942443047415, "2": 0.26273916683722026, "4": 0.20578704644649548, "1": 0.13939819905504, "5": 0.10468836440435672}, "score": 2.873627224748571}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2884397077912693, "2": 0.23721561108654368, "4": 0.23546657680330207, "5": 0.13432023723791978, "1": 0.1045470572838029}, "score": 3.0577979504091126}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2851140794590475, "2": 0.25899347775831744, "4": 0.21318856994880758, "1": 0.13302808601621846, "5": 0.10966745812123053}, "score": 2.907473065771772}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28770086552506935, "2": 0.2568722755292628, "4": 0.2185013032354451, "1": 0.12428192566607059, "5": 0.11263392735521568}, "score": 2.9383324327432496}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2918120057432831, "2": 0.259986414826248, "4": 0.21091883241757822, "1": 0.12938808240967645, "5": 0.10788367668971212}, "score": 2.9079225944128337}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.280126217667097, "2": 0.25668002723370387, "4": 0.20047113654097407, "1": 0.1556154311873303, "5": 0.10709897200862886}, "score": 2.846756932002549}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28245642163330736, "2": 0.28203384429916806, "4": 0.18493725011663356, "1": 0.16036734324621452, "5": 0.09019811952220529}, "score": 2.7625632912829903}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2892212537122692, "2": 0.2742405330059013, "4": 0.1932676042369837, "1": 0.14940774005923307, "5": 0.09385537925602885}, "score": 2.8079209110042385}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2778113479900476, "2": 0.2586786296214306, "4": 0.20124329097687824, "1": 0.15362727537146384, "5": 0.10863283164476296}, "score": 2.8525747972992086}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28681533567961115, "2": 0.26500038504419715, "4": 0.20154399176694676, "1": 0.1483294300648175, "5": 0.09830510699745006}, "score": 2.836494020355548}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27599431811962233, "2": 0.24560463763715257, "4": 0.20470527852671522, "1": 0.15264837578230186, "5": 0.1210204184622226}, "score": 2.8958419169525857}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2682676775791315, "2": 0.22864671406658268, "4": 0.2125992374209616, "1": 0.15061201287971038, "5": 0.13984466612960278}, "score": 2.9624167139340902}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2693546139661225, "2": 0.2328408281152344, "4": 0.21944955294742569, "1": 0.13953133211015523, "5": 0.13880269703643214}, "score": 2.9851511432177293}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2752337616591738, "4": 0.23844814826121824, "2": 0.222173760124234, "5": 0.1485057946928542, "1": 0.11562003784564721}, "score": 3.0820474194967202}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2712980627396869, "4": 0.23175453644315722, "2": 0.2252664849599015, "5": 0.14788673533521782, "1": 0.12377107363888322}, "score": 3.054720639299344}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26967433895204995, "4": 0.2503750713559224, "2": 0.21196595644744348, "5": 0.16236688210103223, "1": 0.10561122669090478}, "score": 3.1519214169328245}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2668868214897388, "4": 0.2598976186341964, "2": 0.20508521567454835, "5": 0.16748499731452257, "1": 0.10063672784725552}, "score": 3.1885105666742475}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2692358816932777, "4": 0.2628240190128385, "2": 0.20588374791431224, "5": 0.165276425629045, "1": 0.09677353701677893}, "score": 3.1939472874006385}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26787894453888356, "4": 0.25987152622314647, "2": 0.2072611679602452, "5": 0.16657332102133543, "1": 0.09840890313526383}, "score": 3.18894035358488}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.25980625469420654, "4": 0.2559018004717491, "2": 0.20576764164296643, "5": 0.17189054001770396, "1": 0.10662732158955668}, "score": 3.180661759432943}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28710617037791075, "2": 0.27756464998797137, "4": 0.17883360258133546, "1": 0.16325183017753753, "5": 0.09323016041853166}, "score": 2.761222368933404}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2808413387205954, "2": 0.26013886354097193, "4": 0.20415572877773702, "1": 0.14087047891795074, "5": 0.11398162816751965}, "score": 2.8902378507747692}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2951606484058304, "2": 0.27797889095250183, "4": 0.18974092309064808, "1": 0.13960896102367448, "5": 0.09749829386031565}, "score": 2.8275385795252252}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28891605505532153, "2": 0.2579607080598879, "4": 0.204903426722423, "1": 0.13602210087704056, "5": 0.11218576114083045}, "score": 2.8992688356396084}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2843110766362228, "2": 0.25196928092311666, "4": 0.21136871628738946, "1": 0.13264458777796065, "5": 0.11969117441563468}, "score": 2.9334916001089266}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2933311216605496, "3": 0.2901449364466364, "4": 0.17487427357014532, "1": 0.1583447438169396, "5": 0.08329217265089253}, "score": 2.731434584870313}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.3151284643375535, "3": 0.30286885165309624, "4": 0.15778790833929773, "1": 0.15712328924358318, "5": 0.0670816664238784}, "score": 2.6625728848271892}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2902948640437687, "2": 0.2789385701716148, "4": 0.183349813801716, "1": 0.15753282968391505, "5": 0.08987582352308869}, "score": 2.769095361263526}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2994440770189279, "2": 0.2818285138305311, "4": 0.18490769950522165, "1": 0.1459721834121833, "5": 0.0878400615952669}, "score": 2.786813350679722}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.29610836312936956, "3": 0.29298364225639634, "4": 0.1697455207883283, "1": 0.16029731008704004, "5": 0.08085692857259759}, "score": 2.714754045582212}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2812866001678666, "2": 0.26903134015881924, "4": 0.17745869524344637, "1": 0.16876511210910652, "5": 0.10344424573212868}, "score": 2.7777825098216997}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3046723932948967, "4": 0.23731621183149518, "2": 0.2297280180538796, "5": 0.1361064879497308, "1": 0.09216350970713265}, "score": 3.095475427644108}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31097420884518906, "4": 0.2343455601907125, "2": 0.23304623770924635, "5": 0.13220147424505369, "1": 0.08942179809120307}, "score": 3.086859606003933}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.316902444032624, "2": 0.24904387331158165, "4": 0.21815787086582814, "5": 0.11581394476260183, "1": 0.10005995726659227}, "score": 3.000621986173834}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30433037737484525, "2": 0.24577875933658244, "4": 0.22260150036037446, "5": 0.1210715724991514, "1": 0.10620303419585404}, "score": 3.0065599144300137}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28126409813994635, "2": 0.25575313913323017, "4": 0.20929578254915926, "1": 0.1396552630315986, "5": 0.11401852999279563}, "score": 2.90226788852999}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28462063234853396, "2": 0.239510529161855, "4": 0.22648349646565452, "5": 0.12729920735867797, "1": 0.12207526478516312}, "score": 2.9974208244154994}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2891928824989108, "2": 0.251536593256651, "4": 0.2213308805693945, "1": 0.12040899976767754, "5": 0.11752036984971485}, "score": 2.964016657781886}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2831163882456061, "2": 0.24444080639799354, "4": 0.23102923916467832, "5": 0.12388271595967154, "1": 0.11752247348316262}, "score": 2.9993089119306315}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28540778408845596, "2": 0.2466825232678049, "4": 0.21550943252038765, "1": 0.13547905855716308, "5": 0.11690749475817477}, "score": 2.931682845244482}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2918547593337485, "4": 0.25801622717790523, "2": 0.21582750031701126, "5": 0.14927537864384427, "1": 0.08501188574273248}, "score": 3.170718145189223}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28746283404159306, "4": 0.2738551395972258, "2": 0.2120022481256663, "5": 0.1482692650203447, "1": 0.07840277161645104}, "score": 3.201587438888406}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2908147536245093, "4": 0.2744873782401243, "2": 0.2109108598363956, "5": 0.14773911457933273, "1": 0.07603724446388829}, "score": 3.2069824628438006}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29417601509146246, "4": 0.2793821838333569, "2": 0.20573334303597285, "5": 0.15307420119827778, "1": 0.0676259631096308}, "score": 3.244547345184649}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2917436421994393, "3": 0.29131768682130116, "2": 0.1960916945133134, "5": 0.1596785575242986, "1": 0.06115687467672116}, "score": 3.2926986923725288}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26966363309330627, "2": 0.25843134764914893, "4": 0.2033513922667537, "1": 0.1510104408281957, "5": 0.11752813820290313}, "score": 2.8779536028177546}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27398960808784467, "2": 0.2535647917121541, "4": 0.20975921528233274, "1": 0.14656462815300747, "5": 0.1161019377574804}, "score": 2.8952669670743933}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2797182590691085, "2": 0.2604417893887207, "4": 0.203118749106742, "1": 0.1473657481062826, "5": 0.10934009682228402}, "score": 2.866623608821181}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2810545501053776, "2": 0.2478727424000231, "4": 0.21907971937329404, "1": 0.130050232410934, "5": 0.12192553371395874}, "score": 2.9549568038455574}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2743484678904349, "2": 0.2555117454359185, "4": 0.20863052800989126, "1": 0.15067933643059328, "5": 0.11081065999008226}, "score": 2.8733789906882903}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3084281697076025, "2": 0.2516304339061288, "4": 0.2282084530392156, "5": 0.1072075289574082, "1": 0.1045167430329694}, "score": 2.9819594345457863}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28985934236283206, "4": 0.2422637185726035, "2": 0.23592427360567636, "5": 0.1338313036676465, "1": 0.09811441316621199}, "score": 3.0777737663905365}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3205591385456032, "4": 0.25886095881089205, "2": 0.22605962207762784, "5": 0.12642251349958653, "1": 0.06808597732671964}, "score": 3.1494761713641304}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3096903350341358, "4": 0.24391423777568025, "2": 0.23894982173332335, "5": 0.11800816051510869, "1": 0.08942723510181046}, "score": 3.06212690117467}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2967020922424235, "2": 0.24455300602628527, "4": 0.2297095716346635, "5": 0.12493141153437635, "1": 0.10409243255496961}, "score": 3.026834831792265}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "human", "scores": {"2": 0.27219460743518764, "3": 0.263748125849762, "1": 0.18973382691282387, "4": 0.17407500664157527, "5": 0.10023817248050643}, "score": 2.722886246966169}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2765834210241381, "2": 0.2525545535347426, "4": 0.20152502736961037, "1": 0.15929024509582332, "5": 0.11003470092314603}, "score": 2.850457583196449}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28395289989924444, "2": 0.2661970912541156, "4": 0.184431197192025, "1": 0.1620929569469967, "5": 0.10331631265295435}, "score": 2.80067891541714}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2758434732631049, "2": 0.26441228721911525, "4": 0.18784430953903272, "1": 0.16824643489721228, "5": 0.103644531580659}, "score": 2.7942263712347097}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2843149148616654, "2": 0.265194701534728, "4": 0.18417564211128146, "1": 0.1614650126059729, "5": 0.10483928714566702}, "score": 2.8057274611124683}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2994990899486592, "2": 0.28171957998535324, "4": 0.18369819731685127, "1": 0.14965524452877105, "5": 0.0854082140122202}, "score": 2.773480099698728}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2984349777085553, "4": 0.24596584356172876, "2": 0.22127606369962705, "5": 0.14226616136803946, "1": 0.09204299262018051}, "score": 3.125137864412784}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31188014987108137, "2": 0.2504689295205879, "4": 0.21298905490830627, "1": 0.11700838266985378, "5": 0.10763784217583512}, "score": 2.94377816504215}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2851754711289311, "4": 0.2586463744074712, "2": 0.20433820300492733, "5": 0.1600879863833755, "1": 0.09174004493546581}, "score": 3.1910063311205383}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3023072483934676, "2": 0.24276526261183706, "4": 0.22895250469900505, "5": 0.11909408118922302, "1": 0.10686873214943322}, "score": 3.0106380696422357}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2984644943874264, "2": 0.2606681856031121, "4": 0.20671192947549089, "1": 0.1246196724823789, "5": 0.10952307733640618}, "score": 2.9158494898578016}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3077552360776764, "4": 0.2500481949248773, "2": 0.23132956428322068, "5": 0.12304133784885316, "1": 0.08781434579020939}, "score": 3.0891736243002477}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3081482440349958, "4": 0.2557539319691904, "2": 0.2233314026842475, "5": 0.1399479375749404, "1": 0.0728094153799505}, "score": 3.166701085379823}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3003099713245966, "4": 0.26991540065218067, "2": 0.20558691303099902, "5": 0.1540347581134486, "1": 0.0701404793573432}, "score": 3.2321199414149366}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3040965285050854, "2": 0.241653716772574, "4": 0.24088888738545786, "5": 0.12287383275630094, "1": 0.09047835754723577}, "score": 3.064026676592622}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3599785257520156, "3": 0.3006580519647619, "1": 0.1756511417761893, "4": 0.12104455233973159, "5": 0.04265693993471164}, "score": 2.49507217562595}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3255546291257874, "2": 0.24644466338776855, "4": 0.24022295685153627, "5": 0.10430645814046748, "1": 0.08346036754352053}, "score": 3.03547086217509}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.3365560083210601, "3": 0.32304785785543316, "4": 0.15879233493585052, "1": 0.13076683855102914, "5": 0.050827771027483995}, "score": 2.662355088844231}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31456542369761803, "2": 0.30902061163148875, "4": 0.168504537629565, "1": 0.14277791470016693, "5": 0.06511972371517104}, "score": 2.704164056528792}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.32262110301788727, "2": 0.25831283237353875, "4": 0.21856131193213052, "1": 0.10066787973503018, "5": 0.09982675953423621}, "score": 2.9585658201162714}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2985795746303044, "2": 0.25831383979554945, "4": 0.21207058746252977, "1": 0.12425893563646566, "5": 0.10676399871151938}, "score": 2.9187658125928646}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27758024955964455, "2": 0.2486922725566234, "4": 0.22197844420497034, "1": 0.12784329792643787, "5": 0.1238946092712735}, "score": 2.9653884092328093}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29431195581032277, "2": 0.2635786166742161, "4": 0.213387738412709, "1": 0.12450691779531835, "5": 0.10420675755398127}, "score": 2.909208073671706}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.296350323243432, "4": 0.23976348996566121, "2": 0.23405175801140166, "5": 0.12881117585700197, "1": 0.1010131068265952}, "score": 3.0613084920569134}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2762434601763974, "2": 0.23316579778312732, "4": 0.22452394909638532, "5": 0.13822392001886305, "1": 0.12783060371723168}, "score": 3.0121449329252283}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27520018518845774, "2": 0.2671919406533559, "4": 0.1854006722338796, "1": 0.16973099119362434, "5": 0.1024653383533311}, "score": 2.783675073933711}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2862583368989449, "2": 0.2619959063398939, "4": 0.2051833724323801, "1": 0.13817041007722497, "5": 0.10837550328181868}, "score": 2.883595735210551}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28360257632603514, "2": 0.27014976191476553, "4": 0.1912253697863303, "1": 0.15753519269408284, "5": 0.09747128082591573}, "score": 2.800944635387327}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2929583588590639, "2": 0.2561073721435079, "4": 0.21274366259711228, "1": 0.12571080606206828, "5": 0.1124612006426485}, "score": 2.930135780161543}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2811960685831129, "2": 0.2526401082498979, "4": 0.21271183852568767, "1": 0.13566563319010783, "5": 0.11776991863611275}, "score": 2.924279056859543}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29655543898369163, "4": 0.25151730113981036, "2": 0.21816053240808808, "5": 0.14745327987311777, "1": 0.08629909220581936}, "score": 3.1556673787321694}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.2861771369275272, "3": 0.27437579435867226, "5": 0.20347451812477435, "2": 0.17525284837321575, "1": 0.06071056156037109}, "score": 3.3964558255492165}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3006540833046692, "4": 0.25656339266853884, "2": 0.20892300333308808, "5": 0.15783034321296324, "1": 0.07601276441267066}, "score": 3.211279014672886}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.28641436157178274, "3": 0.27305309923993293, "5": 0.20685130027864193, "2": 0.17465167799798242, "1": 0.059018430647627663}, "score": 3.407432957672223}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2653665768548499, "3": 0.25435208764046124, "5": 0.22308417776107103, "2": 0.17754469481300525, "1": 0.0796430104318648}, "score": 3.374707758624876}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31122156276116003, "2": 0.24915183231930202, "4": 0.2342360292461765, "5": 0.10458712739309664, "1": 0.10079689776090128}, "score": 2.9926646081406387}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3152371708902709, "2": 0.2647554789257311, "4": 0.21628008964122966, "1": 0.11023439683245967, "5": 0.09348640073036144}, "score": 2.9180280887284837}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.308023684881262, "2": 0.2642845012078408, "4": 0.21594848394463512, "1": 0.1171487832897375, "5": 0.09458829898034508}, "score": 2.906542430223508}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3180020339987283, "2": 0.25994500228896233, "4": 0.22489629368233352, "1": 0.10146812187781198, "5": 0.09568296505239417}, "score": 2.95338071746243}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3195023340085981, "2": 0.25756406337901094, "4": 0.22868801139217937, "1": 0.09987267043237666, "5": 0.09436799493708818}, "score": 2.960114400552081}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29914256895085184, "4": 0.23537676343724048, "2": 0.2348467042577953, "5": 0.12343161512004928, "1": 0.10719589757153046}, "score": 3.0330017071593582}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29534320266557335, "4": 0.24128714058519837, "2": 0.231813989106233, "5": 0.1287114888384776, "1": 0.1028360198177685}, "score": 3.0612245890509944}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29659538769180777, "2": 0.25231905525700127, "4": 0.21135231471139493, "1": 0.13027000772145025, "5": 0.10945423087297358}, "score": 2.9174009620567345}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29729023355160444, "4": 0.25408653017452426, "2": 0.2276770048074721, "5": 0.1300971239714141, "1": 0.09084183151135894}, "score": 3.104920873689722}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2962461151608128, "4": 0.2391567940743775, "2": 0.2299663235792349, "5": 0.13347053995345357, "1": 0.10115415890500877}, "score": 3.0738236805782737}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2744496113752984, "2": 0.24108832954644077, "4": 0.22706846478331924, "5": 0.1300097800763179, "1": 0.12737510030011373}, "score": 2.991249418537433}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2775903814236589, "4": 0.24084372495318343, "2": 0.2271602189761907, "5": 0.14207516932493697, "1": 0.11232172285651788}, "score": 3.073191041711631}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28157343361625353, "2": 0.23805660439408363, "4": 0.23672044287753838, "5": 0.12940936849996576, "1": 0.11423124731117022}, "score": 3.0290203392378614}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2752402022045507, "4": 0.24839335015343902, "2": 0.2190078511080013, "5": 0.15861948834456818, "1": 0.09873058520986659}, "score": 3.149164576641481}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.26832528083299584, "4": 0.25852227979127784, "2": 0.20418249534829014, "5": 0.1715294683539499, "1": 0.09742948435746286}, "score": 3.2025419786388567}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2785828715400644, "2": 0.2694258137992372, "4": 0.2035017244865524, "1": 0.1405271739517747, "5": 0.10795203185632332}, "score": 2.868924265358004}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27754214040763314, "2": 0.24785930806145887, "4": 0.21901058872325022, "1": 0.13355049940129834, "5": 0.12202591973138525}, "score": 2.948101522222806}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2859433113133502, "2": 0.24530861698049672, "4": 0.22998814841891482, "5": 0.12397136096650455, "1": 0.11477774187514735}, "score": 3.0030668028053062}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2823762718746366, "2": 0.2619865270543371, "4": 0.21501155674430164, "1": 0.13091975509462075, "5": 0.10969677615096644}, "score": 2.910578256895056}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2824791320425529, "2": 0.2654551975492633, "4": 0.20223829472429128, "1": 0.1421811827265194, "5": 0.10763435476624493}, "score": 2.8676878749182535}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2914734668929788, "3": 0.2717282209203132, "1": 0.18650955648586137, "4": 0.16165305114194362, "5": 0.08861507403565108}, "score": 2.6743839017180573}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.27644104487853705, "3": 0.26473705258564195, "1": 0.17931771542304228, "4": 0.1760262407301286, "5": 0.1034522836622916}, "score": 2.7478478614202695}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.292809339559801, "2": 0.27313819584301835, "4": 0.19995874674198347, "1": 0.132206775630463, "5": 0.10187310589863378}, "score": 2.8661513594618677}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27433464107609185, "2": 0.26358109432485777, "4": 0.19844638819386326, "1": 0.15013959264630194, "5": 0.11348554579433559}, "score": 2.8615554366631333}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.27429823928453334, "3": 0.26620552983565915, "4": 0.1848614413859375, "1": 0.1698977488916055, "5": 0.10472109510261113}, "score": 2.78020638980448}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "human", "scores": {"3": 0.25733979701679693, "2": 0.2561908767573392, "1": 0.19329193816014545, "4": 0.17695698474198876, "5": 0.11620448942309759}, "score": 2.7665874960071593}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2703603987136996, "3": 0.257437038359843, "1": 0.1892029746947213, "4": 0.17220457834028272, "5": 0.11077488500415376}, "score": 2.7449828680544086}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.27701339958824434, "3": 0.2437050734849436, "1": 0.21776275252099492, "4": 0.15678552349143265, "5": 0.10471512617030647}, "score": 2.653670594069963}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2627620524153042, "3": 0.2582687679631369, "1": 0.18416984066992814, "4": 0.17562116068524702, "5": 0.11916031590991027}, "score": 2.7828361796923358}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2593964999652993, "2": 0.2574377591845595, "4": 0.18242296585044904, "1": 0.1814122161233399, "5": 0.11931661366717593}, "score": 2.800791223745507}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27264767092733255, "2": 0.2636907668704048, "4": 0.1969524401399866, "1": 0.15583607897278873, "5": 0.11086278650006362}, "score": 2.843313481254841}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28794355719931075, "2": 0.25732983815935756, "4": 0.20581145423755742, "1": 0.13913659924939123, "5": 0.10976820102526674}, "score": 2.8897436784627866}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28674602079001926, "2": 0.2773275445676684, "4": 0.19198013036343858, "1": 0.1498194315034554, "5": 0.09411831669042736}, "score": 2.8032486727486363}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2864976629795654, "2": 0.26078892899583955, "4": 0.2054234542165625, "1": 0.13868795465849593, "5": 0.10858888769154071}, "score": 2.884434876059544}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28584224821675575, "2": 0.268342185858191, "4": 0.1917221290031232, "1": 0.15550076931682594, "5": 0.09858230460108759}, "score": 2.809541039986488}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27009241520787935, "4": 0.2287915847709811, "2": 0.2287549352948022, "5": 0.14356324631630787, "1": 0.12877790822697746}, "score": 3.0296079151538504}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3001039092888605, "3": 0.26520422219540796, "5": 0.20889578243923348, "2": 0.17000835433369116, "1": 0.055775571064382454}, "score": 3.436341283910908}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28184415574710786, "2": 0.23539305207285063, "4": 0.23168129041133276, "5": 0.13480332697298533, "1": 0.11626625689894186}, "score": 3.0333627761006907}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2738796233411128, "3": 0.26873347225968314, "2": 0.19568925726119313, "5": 0.17808096011287722, "1": 0.08360076568683422}, "score": 3.267155008397273}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28001973392298246, "4": 0.23766415863964432, "2": 0.23322829459113145, "5": 0.13977712348763435, "1": 0.10929312347562577}, "score": 3.0654050129693338}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2837878860444565, "2": 0.2805523052285463, "4": 0.1801029404807251, "1": 0.15644957897284711, "5": 0.0990939885430743}, "score": 2.7848365925621694}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27039514225715916, "2": 0.26999730540906186, "1": 0.18017629333171573, "4": 0.1745359572199076, "5": 0.10488382184719226}, "score": 2.7539508842139524}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2799410874261411, "3": 0.2704183972393432, "1": 0.18395614356008652, "4": 0.16721531259817318, "5": 0.09846010876410413}, "score": 2.716279616165696}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28425205978287443, "2": 0.25816708174564335, "4": 0.19453493843480288, "1": 0.15036767762063608, "5": 0.1126678690705905}, "score": 2.8609667973496284}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2713474163458736, "2": 0.2665400140814568, "1": 0.18485484195028065, "4": 0.17441919682971996, "5": 0.10282680612317248}, "score": 2.7438201074694746}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "human", "scores": {"3": 0.34746810582085064, "2": 0.3004144973810965, "4": 0.1923940242932031, "1": 0.09900177497181872, "5": 0.06070967519264281}, "score": 2.81539312640777}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3222363488648777, "4": 0.25963086675681374, "2": 0.23559357461704808, "5": 0.10963684324095925, "1": 0.07289319437132434}, "score": 3.0975254843973072}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3359468889883925, "2": 0.27359578474122354, "4": 0.21650929487784204, "1": 0.09312392928120515, "5": 0.08081400494075835}, "score": 2.9182928364445564}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3358156937576502, "2": 0.2854791164063015, "4": 0.21113441719873235, "1": 0.09521658882514776, "5": 0.07234459029645636}, "score": 2.879910151651201}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3136573597077584, "2": 0.267519397836111, "4": 0.22126885021753084, "1": 0.1048752531889818, "5": 0.09266778367365601}, "score": 2.9293337109084883}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "human", "scores": {"1": 0.28211759257935753, "2": 0.2652105341310079, "3": 0.2111524910783956, "4": 0.13860692909576894, "5": 0.10289296559947762}, "score": 2.5149376883454453}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2542688009706956, "3": 0.22711876601892494, "1": 0.219105616126592, "4": 0.17035346408120447, "5": 0.12913715789023703}, "score": 2.7361434735044803}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.25867969020598625, "3": 0.23529792542759292, "1": 0.21874235564016206, "4": 0.1707688997466065, "5": 0.11649536408848986}, "score": 2.7075906166351724}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2563622232522894, "3": 0.24084702453481738, "1": 0.20177521464264916, "4": 0.18071152566363802, "5": 0.12029099660391021}, "score": 2.761377760593195}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.26436152493330456, "3": 0.23160192999645315, "1": 0.21830646514328145, "4": 0.1681987437934523, "5": 0.11751194394126907}, "score": 2.7022424022835474}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.27754674764540394, "3": 0.2597353372673442, "4": 0.1862046018295784, "1": 0.17200003477301715, "5": 0.10450432718141331}, "score": 2.7736644130024923}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2882463161403934, "2": 0.2540244898192913, "4": 0.22341346971638432, "1": 0.12020501928189384, "5": 0.11410167980558474}, "score": 2.9571819145011284}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2947600922844593, "3": 0.27641022342036126, "4": 0.17573623022665671, "1": 0.1703969779124105, "5": 0.0826870317508578}, "score": 2.7055534647466875}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27692100333069436, "2": 0.25437739693229783, "4": 0.21172659136802105, "1": 0.1372870485812753, "5": 0.11967676446573142}, "score": 2.9221277543997726}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.28375513881195863, "3": 0.27462287119142176, "4": 0.18876479685346573, "1": 0.15955399298941006, "5": 0.09329273884888795}, "score": 2.7724847696542785}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "human", "scores": {"3": 0.319504570532764, "2": 0.23985214691512885, "4": 0.23266254033383602, "5": 0.10841194525157388, "1": 0.09955822799539173}, "score": 3.0105179390948678}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3251735627401901, "2": 0.259971440040032, "4": 0.21614677244387268, "1": 0.1031402259139081, "5": 0.09555701442012411}, "score": 2.9410082614249493}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3242495641387685, "2": 0.2658032248920186, "4": 0.20440803729940382, "1": 0.11917539064332971, "5": 0.08634917746744654}, "score": 2.872950530427091}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3162274961156134, "2": 0.26812092166204105, "4": 0.2079122215773813, "1": 0.12259654953040734, "5": 0.08513372699518741}, "score": 2.8648644272572263}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3108054889283392, "2": 0.26332578161810116, "4": 0.2057502550118431, "1": 0.12481214650729984, "5": 0.09529898680647071}, "score": 2.8833972979967295}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2963302017396165, "2": 0.24212121252998464, "4": 0.2259647647614421, "5": 0.12053039707250264, "1": 0.11504754514690302}, "score": 2.994809225567394}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31831354226420255, "2": 0.26431383841565986, "4": 0.22454754780352565, "1": 0.09790745335643766, "5": 0.09491217392323596}, "score": 2.954242901408976}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3196740807070989, "2": 0.2813977021819218, "4": 0.21105481342024252, "1": 0.10404480035005081, "5": 0.0838225260782538}, "score": 2.889211889406304}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31024710069547184, "4": 0.2495398392961075, "2": 0.2303512410370517, "5": 0.1221206241710151, "1": 0.08773248830740257}, "score": 3.0879656358584695}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3045968439098705, "2": 0.2397589345026289, "4": 0.23826728243549009, "5": 0.1204813511824098, "1": 0.0968870705349494}, "score": 3.0456972984515356}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27568722462057454, "2": 0.24835346138455824, "4": 0.2244782406736246, "1": 0.13083987914471187, "5": 0.12063354288333233}, "score": 2.9557117679040585}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.26886537213350836, "4": 0.2630381763800727, "2": 0.21120881295795502, "5": 0.16049909099671078, "1": 0.09638448830617222}, "score": 3.180059299704511}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2794626574899512, "4": 0.2448602106620536, "2": 0.23048822556446447, "5": 0.13578057708097693, "1": 0.10940157416729694}, "score": 3.0671304443934684}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2708546361461464, "4": 0.2556966495043049, "2": 0.20903294664319347, "5": 0.16500706298962167, "1": 0.09940382352630524}, "score": 3.1778710500102108}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.27568871333560707, "3": 0.26935170495200034, "2": 0.19462273240385466, "5": 0.1800165118138338, "1": 0.08031619477261061}, "score": 3.2804677769142545}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3061355503849658, "4": 0.24720597079224144, "2": 0.2360525569050502, "5": 0.12023660128857414, "1": 0.09036396575089034}, "score": 3.0708990646184198}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29797645668812794, "4": 0.2692403779700459, "2": 0.2126907172888088, "5": 0.14287879436277878, "1": 0.07720474964075066}, "score": 3.1878994231910562}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3149099040363318, "4": 0.2691820937377112, "2": 0.2187896528500956, "5": 0.12668782365782746, "1": 0.07042570180409423}, "score": 3.162917470494939}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.30560639373527787, "3": 0.2931228718562049, "2": 0.1739383939881752, "5": 0.17321600144939694, "1": 0.054109467956706354}, "score": 3.3698836082080224}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29844145381783715, "4": 0.29438501310378995, "2": 0.1898036997706969, "5": 0.16274641919655314, "1": 0.054616567947427086}, "score": 3.3208432123764977}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3031169725349443, "4": 0.24409521607334347, "2": 0.22979485565538926, "5": 0.12201055763515538, "1": 0.10097373959072692}, "score": 3.0563744846258745}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.33269893401683653, "2": 0.2516344348618355, "4": 0.23784223577602784, "5": 0.10010738691790912, "1": 0.07770598480946007}, "score": 3.0310109469839217}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3223383205767327, "4": 0.24407974092721177, "2": 0.24331326731429886, "5": 0.10519166624709093, "1": 0.08507151698128422}, "score": 3.041006997189015}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.32248604983741, "4": 0.25740416574900526, "2": 0.22548694844660094, "5": 0.11986445695136147, "1": 0.07475046843814055}, "score": 3.1221461605755136}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3308539300330295, "2": 0.2450144721945862, "4": 0.23990362470922655, "5": 0.10147721382884556, "1": 0.08273992701912183}, "score": 3.0323640767087316}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26965009631870085, "2": 0.24981643270688322, "4": 0.21156360348654735, "1": 0.1454117798957083, "5": 0.12354809074069824}, "score": 2.9180189729174932}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27226092211835934, "2": 0.24699257587305395, "4": 0.22251699461511867, "1": 0.13564443030868856, "5": 0.1225793626989882}, "score": 2.949393994340424}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28822971363074057, "2": 0.240930612954083, "4": 0.23610482472698338, "5": 0.1243392452760157, "1": 0.11038897657374179}, "score": 3.0230749020910963}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2761895150965335, "2": 0.23777576816041043, "4": 0.23502083716067293, "5": 0.13611719995184418, "1": 0.11488813076833261}, "score": 3.0397035467874365}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27117866361414444, "4": 0.2375792564044499, "2": 0.22615684861732913, "5": 0.14816770571814322, "1": 0.11690999660533227}, "score": 3.073938382697828}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2942772584761808, "2": 0.271053868799013, "4": 0.1868047920768711, "1": 0.15768481185800745, "5": 0.0901674844246695}, "score": 2.7807136842611415}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29518420316539556, "2": 0.2812045327121618, "4": 0.1826649095500587, "1": 0.15175028059246326, "5": 0.0891859110269193}, "score": 2.7763293645526526}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30592625585847844, "2": 0.289340929298118, "4": 0.17724305434135346, "1": 0.1542713058946424, "5": 0.07320207583612173}, "score": 2.7257591731984143}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2834943742291822, "2": 0.25301902384961317, "4": 0.21322315193937694, "1": 0.1342646804484887, "5": 0.11598759885651769}, "score": 2.9236491120147274}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29103725382131124, "2": 0.28154654463731243, "4": 0.1761439888419983, "1": 0.1681880803311311, "5": 0.0830741746324985}, "score": 2.724366888125729}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4844108832839286, "2": 0.28635215912787926, "3": 0.13447526502666135, "4": 0.05302562456030519, "5": 0.04171573847166758}, "score": 1.8812604323587956}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.38080560391875784, "2": 0.3070288382926359, "3": 0.17289472426053268, "4": 0.08180033009421304, "5": 0.05745862243777818}, "score": 2.128067169409073}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.4766932675044483, "2": 0.292652201685904, "3": 0.13426583512970566, "4": 0.05409961010972179, "5": 0.042269415173379066}, "score": 1.8925779203299016}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.4371781067437706, "2": 0.291263972792437, "3": 0.1539294959355138, "4": 0.06654898406483921, "5": 0.05106421094726895}, "score": 2.0030420364919723}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.4319093848637481, "2": 0.29438271690964296, "3": 0.1544217628844512, "4": 0.06834867510360346, "5": 0.0509241504186543}, "score": 2.011982338966647}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2902219221099724, "2": 0.2768265893670543, "4": 0.18677938835264105, "1": 0.15177296895532472, "5": 0.0943838595304188}, "score": 2.7951714520587956}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.32056317761619496, "2": 0.28247006460794744, "4": 0.2039384798462985, "1": 0.10463811558380076, "5": 0.08837651606539607}, "score": 2.8889437006961454}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3173034840978232, "2": 0.2689552150617636, "4": 0.21671134897148253, "1": 0.10349448010683936, "5": 0.09352977913250271}, "score": 2.927826321103026}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31022864154214574, "2": 0.29244961019163757, "4": 0.19628409596675475, "1": 0.1183344430892254, "5": 0.08269320870283586}, "score": 2.832550342420798}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2945960744674867, "2": 0.26283805419018963, "4": 0.21706125156381226, "1": 0.1197569747653733, "5": 0.10573778246245984}, "score": 2.926184084754591}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29527123629654195, "2": 0.26408538502563966, "4": 0.20606846727522318, "1": 0.12876581654910813, "5": 0.1057948962843336}, "score": 2.896039765633457}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2840432680888088, "2": 0.2528102175506236, "4": 0.2136828441382826, "1": 0.13280932845722654, "5": 0.11664205413267681}, "score": 2.9285371998299423}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2989380851831712, "2": 0.24878980391646638, "4": 0.22367957946783448, "5": 0.11489555278130868, "1": 0.1136854903301506}, "score": 2.977309639779541}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28239561531176516, "2": 0.2534387759779997, "4": 0.21657269808115825, "1": 0.1259770791608971, "5": 0.12160519358003523}, "score": 2.9543896657438014}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28800492450980464, "2": 0.24853161952268302, "4": 0.22974414552681469, "5": 0.12230582605691073, "1": 0.11140129798343112}, "score": 3.0030216189737495}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28962123380748434, "2": 0.26370616686086534, "4": 0.20998239187382664, "1": 0.13343270641853372, "5": 0.10324773339218705}, "score": 2.8859051645221783}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2932290601899376, "2": 0.25045693234619854, "4": 0.22312159211478744, "1": 0.1201581724964094, "5": 0.11302033734038873}, "score": 2.958388410826083}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30772581608340555, "2": 0.24840102562654423, "4": 0.23865268137435303, "5": 0.1059958644769019, "1": 0.0992144609112975}, "score": 3.0038145016020352}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2997718181200925, "4": 0.24129785397207576, "2": 0.2409028111655421, "5": 0.1215206830287297, "1": 0.09649819263341496}, "score": 3.050440459457216}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2550248468354877, "2": 0.22895799962505667, "4": 0.213352895040065, "5": 0.18407996930558784, "1": 0.11857495342594178}, "score": 3.1154060045779683}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "human", "scores": {"2": 0.29067382986905865, "3": 0.267705174277631, "1": 0.19244347591170724, "4": 0.16639353558458295, "5": 0.08277206944843175}, "score": 2.656372798502279}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2851684273817849, "2": 0.28102804791090075, "4": 0.18645100167871062, "1": 0.15840893394886016, "5": 0.08893649529048314}, "score": 2.766476419883991}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2899880974847341, "3": 0.28440795792282275, "4": 0.1764794570560464, "1": 0.1659528777333917, "5": 0.08316351075602624}, "score": 2.720910365256518}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27960653394319024, "2": 0.2738320819652116, "4": 0.1922666439175813, "1": 0.1541006374600184, "5": 0.10018171419992193}, "score": 2.810594368977851}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2869579757218871, "3": 0.27967507390388885, "4": 0.17690604615904237, "1": 0.16840775957485482, "5": 0.08804261679228241}, "score": 2.729214934087984}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2908040809188967, "3": 0.2845192969851869, "4": 0.1725657251010473, "1": 0.16481167839008426, "5": 0.08728741365611913}, "score": 2.7267098885384837}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2973089039645163, "3": 0.282499725521902, "4": 0.17301799025113124, "1": 0.16477466584378242, "5": 0.08238588131600581}, "score": 2.7109278075379395}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2995782879775597, "2": 0.2972140775497689, "4": 0.18062429919721093, "1": 0.13906596362019652, "5": 0.08350656729321082}, "score": 2.7722889687210452}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2830097300861743, "2": 0.2679574177735832, "4": 0.19671305218361204, "1": 0.1432798884178321, "5": 0.10902800534316313}, "score": 2.8602502043722837}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29434495002986055, "2": 0.2766755663076262, "4": 0.19636268421875944, "1": 0.13413497632444976, "5": 0.09846823205815844}, "score": 2.848351568315443}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2613916556680183, "2": 0.2506434920255726, "4": 0.1895759961045752, "1": 0.17422305072194205, "5": 0.12414499276250046}, "score": 2.8387730325888105}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2644612080172851, "2": 0.2516964200563053, "4": 0.19529327029268292, "1": 0.16745853677538455, "5": 0.12107524102337601}, "score": 2.850827972844835}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2666275868591238, "2": 0.25015881570347437, "4": 0.19510648354471213, "1": 0.16657242152783053, "5": 0.12151929770083957}, "score": 2.854839185485288}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2728937100734824, "2": 0.24402292577706397, "4": 0.2126936737103262, "1": 0.14135548375736276, "5": 0.12901852245568546}, "score": 2.943995946949678}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2714684371384028, "2": 0.25195713629646405, "4": 0.19790869322026824, "1": 0.15775979303917934, "5": 0.12088322282677562}, "score": 2.8721955131032613}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3082104962675546, "2": 0.254356259048904, "4": 0.2268747218430311, "1": 0.10629955286425957, "5": 0.10424851114374303}, "score": 2.9684160490218403}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3131833428588312, "4": 0.25420913108564264, "2": 0.2323265160507329, "5": 0.12361995484792805, "1": 0.07664984468152702}, "score": 3.1158241338113077}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32274565880137185, "2": 0.26310449666365865, "4": 0.21792541669141247, "1": 0.10019077103624847, "5": 0.0960186342096481}, "score": 2.9464758423026667}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3045449754840745, "4": 0.2586217783068282, "2": 0.2179317802064867, "5": 0.13827825269510202, "1": 0.08061238348645595}, "score": 3.1560234262234204}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3048379972639365, "2": 0.255380752602292, "4": 0.22334989528997304, "1": 0.10934166039684808, "5": 0.10707495240310677}, "score": 2.9634351876601315}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30054613780612877, "2": 0.2678175001569464, "4": 0.19680993754172488, "1": 0.1369130946577711, "5": 0.09790374273427217}, "score": 2.8509723047938933}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31411233571485536, "2": 0.275301532553549, "4": 0.19778648276904975, "1": 0.1242392048841498, "5": 0.08854943458820938}, "score": 2.8511037703520405}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31903843422209427, "2": 0.25857916094952993, "4": 0.21479081026801397, "1": 0.10867497849401093, "5": 0.09890685799872352}, "score": 2.936674790396231}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30914647044766097, "2": 0.2716825472453564, "4": 0.20224460465752114, "1": 0.12371855634018993, "5": 0.09319993077950885}, "score": 2.86952377676428}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3094453430591011, "2": 0.2591990965610158, "4": 0.20720567085086009, "1": 0.11984486071468595, "5": 0.10429533966465498}, "score": 2.916906727086624}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.27839926238626644, "3": 0.25061632374358456, "1": 0.21236493344909418, "4": 0.15688283909780362, "5": 0.10172681937749596}, "score": 2.657203981644443}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.26608073532307924, "3": 0.24890021644567237, "1": 0.20684122686560794, "4": 0.1679706360957377, "5": 0.11019692350836273}, "score": 2.708598303763449}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2854157470767152, "3": 0.24693984858694312, "1": 0.22804990326678126, "4": 0.14571105406359577, "5": 0.09387002183728445}, "score": 2.5919300657201862}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.28292899892702816, "3": 0.25707477065498113, "1": 0.2062583025066177, "4": 0.15690915055607443, "5": 0.0968174531321409}, "score": 2.6550945470937757}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2806697970739469, "3": 0.2543084699977507, "1": 0.21412673920265599, "4": 0.15541355785034283, "5": 0.0954730471619633}, "score": 2.6374333352271933}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3048983916530613, "2": 0.2564012701922397, "4": 0.21179316867375123, "1": 0.12634042873698081, "5": 0.1005530831881368}, "score": 2.9038158937440226}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3130731217222031, "2": 0.2977415353101611, "4": 0.17391141823529135, "1": 0.13849489683364988, "5": 0.07676870567963771}, "score": 2.7527149480866306}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30201487737183336, "2": 0.26605636344397277, "4": 0.1965012276715444, "1": 0.14011390220176453, "5": 0.09530185534914494}, "score": 2.8408188963301075}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3016603992901193, "2": 0.2599746117109476, "4": 0.20522227888800876, "1": 0.13010258816536813, "5": 0.10302842066782707}, "score": 2.891098057890109}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29550411992990355, "2": 0.2554635349183601, "4": 0.20980375189113093, "1": 0.1294742317846598, "5": 0.10973967597681089}, "score": 2.914869855178405}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2742034033514666, "2": 0.25497364298728153, "4": 0.19758116836627107, "1": 0.14895361950258934, "5": 0.12426278772317742}, "score": 2.8932231520299276}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2962661420750997, "2": 0.2517314838097529, "4": 0.21339046979324144, "5": 0.12428524403778592, "1": 0.1143105970363392}, "score": 2.9816079845508807}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2892190267171895, "2": 0.25344531478277016, "4": 0.2119513948864309, "1": 0.12560819252064911, "5": 0.11975722625528437}, "score": 2.946803145086835}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28481560730937333, "2": 0.2346214534530105, "4": 0.22590410136652883, "5": 0.14359667173061755, "1": 0.11104865948375181}, "score": 3.056379433904909}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29382086501906385, "4": 0.23707858749638522, "2": 0.23177138561041646, "5": 0.13531281944414175, "1": 0.10199794632185707}, "score": 3.07193827151476}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "human", "scores": {"4": 0.27380776675594437, "3": 0.2493870928206122, "5": 0.20328773291222696, "2": 0.18714604081470163, "1": 0.08635748465788834}, "score": 3.3205266720135618}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.2743759589841983, "3": 0.25151128994814714, "5": 0.20888395927254622, "2": 0.182713833763496, "1": 0.08249077583113078}, "score": 3.344456821827456}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.29170869340457845, "3": 0.24658594130367606, "5": 0.24151647228406362, "2": 0.1589359957907986, "1": 0.06123755095068942}, "score": 3.493338111178506}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2674412133433438, "4": 0.2661354737599904, "2": 0.19923200082940162, "5": 0.18053159048236653, "1": 0.08664115892946485}, "score": 3.2546890637417247}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2866172434030469, "3": 0.2510575960095959, "5": 0.2198031732782793, "2": 0.17263939187189112, "1": 0.06987046159193486}, "score": 3.413848296475032}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29235156827498615, "2": 0.2897391626145474, "4": 0.1767434558119668, "1": 0.1475733261925006, "5": 0.09357671479552003}, "score": 2.7790075848424727}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2976003499847102, "3": 0.2744762068311697, "1": 0.19798571447631388, "4": 0.1502520292251176, "5": 0.0796674725563354}, "score": 2.6160081964101263}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2958610087417291, "3": 0.2948014500265846, "4": 0.16762747037157524, "1": 0.16271107451287523, "5": 0.07898476446400683}, "score": 2.7043096333013383}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.31603844860377595, "3": 0.28666069787091225, "1": 0.15970933054721909, "4": 0.1568767835370875, "5": 0.08070152554351225}, "score": 2.682818533722516}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2741004867125102, "2": 0.27093089245879404, "4": 0.18219473343139173, "1": 0.17268319604193302, "5": 0.1000762283384461}, "score": 2.7660465218925103}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.26563616692470365, "3": 0.2642097192761415, "1": 0.1930287958328824, "4": 0.1712565593156823, "5": 0.10585539651888354}, "score": 2.731270002957367}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.26329450037338764, "2": 0.2540597762715146, "1": 0.19144253379830162, "4": 0.17549468876174587, "5": 0.1156840165454602}, "score": 2.769912244458514}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.28073152314885663, "3": 0.26113854206003595, "1": 0.21334493712549601, "4": 0.15017792817762687, "5": 0.09459144882314573}, "score": 2.63193367898343}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2744506542858032, "3": 0.2659311069963721, "1": 0.18485023912202153, "4": 0.17000675626267137, "5": 0.1047429212530364}, "score": 2.735336617055198}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.27556589381116703, "3": 0.27224431470864124, "1": 0.18530249150325948, "4": 0.17141012538014805, "5": 0.09546434996353027}, "score": 2.7161643084008738}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27102505730411774, "2": 0.2707383019848251, "1": 0.1851207988938908, "4": 0.1735394201373271, "5": 0.09956505792409609}, "score": 2.731686587164827}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27057014452132716, "2": 0.25317893177847683, "4": 0.19639337810496757, "1": 0.16255301244226134, "5": 0.11729736351538338}, "score": 2.8527020924001203}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27903378815363866, "2": 0.24097933404955904, "4": 0.21116275333883291, "1": 0.14443621320446703, "5": 0.12437743572208282}, "score": 2.930065131719595}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27507725321076437, "2": 0.24028386109038424, "4": 0.2101697587129602, "1": 0.1435892766924473, "5": 0.13087026369215868}, "score": 2.9444473390607877}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.27599431811962233, "3": 0.2715848677651901, "1": 0.17674858144650665, "4": 0.1763276794352911, "5": 0.09933645057596541}, "score": 2.7455070375052943}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "human", "scores": {"3": 0.25589691279403753, "2": 0.24724775213172903, "4": 0.1881212833412005, "1": 0.17975429290924358, "5": 0.12894821362350797}, "score": 2.8392563019458508}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2691222612089052, "2": 0.256870759987308, "4": 0.20497497099601816, "1": 0.14977309951890214, "5": 0.119243578466636}, "score": 2.887043437300152}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26137369867810356, "2": 0.2495320288213721, "4": 0.20344430440225728, "1": 0.1538357660278807, "5": 0.1317972265504107}, "score": 2.909833666005541}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26801658930372413, "2": 0.2400075974738858, "4": 0.2188647762321098, "5": 0.13746849711727635, "1": 0.13562693330575967}, "score": 2.982540033891122}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2712670551432336, "2": 0.24299578049754061, "4": 0.21592712769565692, "5": 0.1415072254431574, "1": 0.12828274575466858}, "score": 2.9993802941404066}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3106877159674212, "3": 0.28921853504526207, "5": 0.17578667376303297, "2": 0.17177877875917746, "1": 0.052513720535263576}, "score": 3.3854604621084348}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.32694762143917994, "3": 0.2841659160392981, "5": 0.18454421435704804, "2": 0.1595656887257397, "1": 0.04476648151753543}, "score": 3.4469419026377413}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.33599022893243824, "3": 0.27474238560115144, "5": 0.21727653106814465, "2": 0.13820633905440968, "1": 0.03377325709068585}, "score": 3.5647967964582703}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.35569366860621215, "5": 0.275256937317587, "3": 0.23625349950462565, "2": 0.10797036366765927, "1": 0.02481175862684391}, "score": 3.7486239725768127}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.33214761014646277, "3": 0.2604953938246842, "5": 0.229630886614935, "2": 0.138372867374477, "1": 0.03933965247280998}, "score": 3.5743650164278966}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3074377042697141, "2": 0.2553594547356583, "4": 0.2247173924060804, "1": 0.10648091625319162, "5": 0.10599581147898295}, "score": 2.968387452433518}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3026623655160451, "2": 0.2531439954965503, "4": 0.23102586616240953, "5": 0.11024710759117562, "1": 0.10291323751041839}, "score": 2.9925495554875328}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30713164875720766, "4": 0.248250267131258, "2": 0.22785983450811453, "5": 0.13135450050252434, "1": 0.08539546351771628}, "score": 3.112309437141943}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2946892994128569, "2": 0.2474674303940909, "4": 0.22612159351283648, "5": 0.1188215846005668, "1": 0.11288900495903838}, "score": 2.990519217287221}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2945054117494737, "2": 0.25640619314388763, "4": 0.21613445242896714, "1": 0.12366753295999526, "5": 0.10927785629271376}, "score": 2.930948315322113}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "human", "scores": {"3": 0.268382064469917, "2": 0.2290004523734353, "4": 0.22041919805150378, "1": 0.14123923842494965, "5": 0.1409440325037616}, "score": 2.9908281961286103}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29347515325783585, "4": 0.24353578165663706, "2": 0.22614463647723454, "5": 0.13485798732064402, "1": 0.10197591714468834}, "score": 3.083156160678637}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28616998258853366, "4": 0.24062607654424198, "2": 0.227956672723619, "5": 0.13408169508337547, "1": 0.11115720704091478}, "score": 3.058518869475537}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.285929471991997, "4": 0.2425661554087644, "2": 0.22363084499728184, "5": 0.14209202043927027, "1": 0.10577242783459663}, "score": 3.091575327063269}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2856712513827781, "2": 0.23637713967701515, "4": 0.2333329209419609, "5": 0.12935907685324452, "1": 0.11525202808423911}, "score": 3.0251700696691244}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2976082067376584, "2": 0.2541643433826579, "4": 0.2298703096916033, "5": 0.11118514435722092, "1": 0.1071633685531457}, "score": 2.983749377718464}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31229313406413156, "2": 0.27220410719275695, "4": 0.21099517775688606, "1": 0.11302936802611334, "5": 0.09146853002615091}, "score": 2.8956683843280597}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30871822849339897, "2": 0.2653749625711721, "4": 0.21968194131249438, "1": 0.10965963911021753, "5": 0.09655249779119901}, "score": 2.92809178065977}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3047701174006492, "2": 0.2517824645968548, "4": 0.2306540523204441, "5": 0.1094677493052324, "1": 0.10331947418049267}, "score": 2.991168083725705}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.32332159530248034, "2": 0.2751824903854441, "4": 0.21628138732566055, "1": 0.10205695899883063, "5": 0.08314662196210679}, "score": 2.903277164136143}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2762215273164055, "2": 0.24514571258092363, "4": 0.20685353428474856, "1": 0.14578217841090807, "5": 0.1259872333226847}, "score": 2.9221171671786887}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27382520886621203, "2": 0.24290035049863998, "4": 0.21421247129449217, "1": 0.14101713093374516, "5": 0.12803271010678707}, "score": 2.945342616240782}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27872983489734543, "2": 0.2605362166512814, "4": 0.19844495938501197, "1": 0.14479494642780724, "5": 0.1174785752877628}, "score": 2.88327419501467}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27396451178917186, "4": 0.24143552952931757, "2": 0.21677916856239737, "5": 0.15849530619737334, "1": 0.10931676613509497}, "score": 3.12301451350576}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2728487136107516, "2": 0.2296884852638667, "4": 0.22286557321065462, "5": 0.14471771892615581, "1": 0.12986500384917055}, "score": 3.0228828500196876}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3175667965316161, "2": 0.2859274990854468, "4": 0.1814708398805273, "1": 0.13765712321302037, "5": 0.07736975786483416}, "score": 2.7749668135632417}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3000060613590134, "2": 0.26662742688261964, "4": 0.20548192605178, "1": 0.12501153074177881, "5": 0.1028636452826254}, "score": 2.8945577360726613}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32591916124714604, "2": 0.26067936850814605, "4": 0.2226699831139929, "1": 0.10204340673456583, "5": 0.08867951175001754}, "score": 2.9352622699220503}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31424419633116957, "4": 0.25038395982872497, "2": 0.22666085715660542, "5": 0.1273075584605938, "1": 0.08139637826682786}, "score": 3.1155462776558345}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3104746572817521, "2": 0.2582452149255335, "4": 0.2193128784544646, "1": 0.10869994400375001, "5": 0.10325875051309298}, "score": 2.950184850387909}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2924276188078375, "2": 0.2596315417979449, "4": 0.21141298153098928, "1": 0.13313955701860436, "5": 0.1033744237519635}, "score": 2.892249677938559}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28902543048015333, "2": 0.266937988597629, "4": 0.20297657513953213, "1": 0.13986170024729405, "5": 0.10118305265862364}, "score": 2.8586791358148362}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28544603129402935, "2": 0.23868430494965076, "4": 0.21067310758317423, "1": 0.14752249593764138, "5": 0.11765288996759542}, "score": 2.912247732954428}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3032279639743326, "2": 0.24971984736833427, "4": 0.22502762647089616, "1": 0.11341525192944962, "5": 0.10858632502403077}, "score": 2.965649135729107}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2797549045612739, "2": 0.24789733259572272, "4": 0.2190178818972854, "1": 0.12978013883730555, "5": 0.12353628010778063}, "score": 2.958632274950172}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3190410822520876, "2": 0.2872088579038733, "4": 0.18688216396001292, "1": 0.12983448915888254, "5": 0.07701922599874486}, "score": 2.794039859071457}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3274754462499706, "2": 0.3063506248965759, "4": 0.171151046415316, "1": 0.13574146433118206, "5": 0.059263409731035534}, "score": 2.711839123009049}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32138024276042987, "2": 0.2988539459553441, "4": 0.1689940959291145, "1": 0.14114842255630902, "5": 0.06959805899733254}, "score": 2.727032534848994}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.320520321184364, "2": 0.2922732285526801, "4": 0.1874241403946414, "1": 0.12333045501506432, "5": 0.07644030267319259}, "score": 2.801368312529199}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31989079725770275, "2": 0.28176361619704526, "4": 0.1881330224755382, "1": 0.13052785848775253, "5": 0.07966188806224797}, "score": 2.8046330076372845}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2791939995243034, "2": 0.2633703137728603, "4": 0.19068450937704637, "1": 0.16089343943364787, "5": 0.10584888661217934}, "score": 2.8172234721550304}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28909653948210007, "2": 0.252173256982823, "4": 0.21041670602735452, "1": 0.13572780942672352, "5": 0.11257963962594632}, "score": 2.911946576855805}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28317896388176145, "2": 0.25920521373187694, "4": 0.19646124374021623, "1": 0.15217034421655515, "5": 0.10897881210564075}, "score": 2.8508721571670366}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29234037142434227, "2": 0.24198130690576272, "4": 0.2213715870611784, "1": 0.12302914505643518, "5": 0.12126852225079415}, "score": 2.9758688157394104}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27417335230528667, "2": 0.23513010023655698, "4": 0.21967717426609054, "1": 0.14303094121420423, "5": 0.1279763369155439}, "score": 2.9544373143486906}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3008669315068767, "2": 0.25642788602542355, "4": 0.22063006368747468, "1": 0.11403318231529129, "5": 0.10803633211049898}, "score": 2.952208209410333}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2864478453677402, "2": 0.2349891349880996, "4": 0.23417035867102082, "5": 0.13661563228448662, "1": 0.1077698870973401}, "score": 3.056873120221795}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3130291380385272, "4": 0.25097631671983517, "2": 0.23305828651119476, "5": 0.1246003953101736, "1": 0.07833038441348548}, "score": 3.1104586572057484}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31055470796648926, "4": 0.25759298944749676, "2": 0.22753149741469259, "5": 0.12912997806385934, "1": 0.075182634416966}, "score": 3.1379573095681295}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2992000397582416, "2": 0.24242577449857314, "4": 0.23947168370447675, "5": 0.12620521581180913, "1": 0.0926908608247768}, "score": 3.0640750308878077}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2924327070926728, "2": 0.285691763314997, "4": 0.18241391789573397, "1": 0.14725124521759247, "5": 0.0922014427955748}, "score": 2.786620645606892}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.28482002198550027, "3": 0.26944111762008544, "1": 0.17967383492417194, "4": 0.17057963906865425, "5": 0.09546919967569006}, "score": 2.717345771339667}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30317551007395827, "2": 0.30143246035467, "4": 0.17837970973032438, "1": 0.13911343493409897, "5": 0.07788849705297674}, "score": 2.7544948233414854}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2979880779965528, "2": 0.26715859717983836, "4": 0.2118843228846535, "1": 0.11629495495233862, "5": 0.10666594900043826}, "score": 2.925467110234703}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2933385723656633, "2": 0.2766203473756239, "4": 0.19538252017546276, "1": 0.13378552780906885, "5": 0.10086495863485069}, "score": 2.8529198469792942}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2843385424128015, "2": 0.24510252171159425, "4": 0.21273604651032005, "1": 0.14539691957117848, "5": 0.11241361713191761}, "score": 2.9016657052298784}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2940406076273044, "2": 0.2518811826704551, "4": 0.20911776851459984, "1": 0.1353158910800061, "5": 0.10963315950491345}, "score": 2.9058700504971}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28626523580799573, "4": 0.25010298648658175, "2": 0.21931182575517452, "5": 0.14383452098830288, "1": 0.1004774454553039}, "score": 3.1175062501443462}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2812924228607548, "4": 0.2359025931611637, "2": 0.2298216512977143, "5": 0.1382402728758537, "1": 0.11473249393274405}, "score": 3.053097060766404}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28179125856363013, "4": 0.23955443546574018, "2": 0.22381501370232235, "5": 0.14735426876163144, "1": 0.10747510925911816}, "score": 3.095498687566074}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2806097962856453, "2": 0.2536326547300831, "4": 0.2035490034283871, "1": 0.15346262913493897, "5": 0.10873521198574224}, "score": 2.8604600207032433}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3007553305785399, "2": 0.27262760479719494, "4": 0.1978524357761603, "1": 0.13756325930520183, "5": 0.09119348690202815}, "score": 2.832483965703879}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29038199460575514, "2": 0.2677871045956593, "4": 0.2017769095615708, "1": 0.14283885103621222, "5": 0.097206256723893}, "score": 2.842723219176622}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2895424964988343, "2": 0.24997951611919725, "4": 0.21707002101551717, "1": 0.13103304967561968, "5": 0.11236597509805789}, "score": 2.9297557276455186}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2800550186323468, "2": 0.2488956367238233, "4": 0.2126453977259255, "1": 0.14383203267261377, "5": 0.11456184165499142}, "score": 2.9052084241701506}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2998032958135451, "2": 0.2542195284517288, "4": 0.21435786377508675, "1": 0.11655679663663412, "5": 0.11505196305745997}, "score": 2.9571282157705583}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2909712831539276, "2": 0.2898606757188737, "1": 0.16972399842083927, "4": 0.16677171129389431, "5": 0.08265755907785471}, "score": 2.702773766163671}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2937624298605807, "2": 0.2631130476987538, "4": 0.20614672632878864, "1": 0.13083255231663285, "5": 0.10613304822562228}, "score": 2.893633373246412}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30406490411061793, "2": 0.25909372763130917, "4": 0.20875983554038235, "1": 0.12161581017684249, "5": 0.10645096738395557}, "score": 2.919335232101993}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3011957480065999, "2": 0.26543701449100804, "4": 0.20496638272465895, "1": 0.12839659586917967, "5": 0.09999060974031707}, "score": 2.882715795144082}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.31318099399256805, "3": 0.256401424033048, "1": 0.21941174504669703, "4": 0.14039432618426348, "5": 0.07059820215738721}, "score": 2.5295799857878434}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2749306211149432, "2": 0.26514357692484286, "4": 0.18561623303158384, "1": 0.15792093225140846, "5": 0.11637810066522436}, "score": 2.837385279623728}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2752956411637905, "2": 0.2619149621113622, "4": 0.19851468534589192, "1": 0.1492890230369916, "5": 0.11497981359307945}, "score": 2.8679805287654645}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.282603478468989, "2": 0.26300774462357657, "4": 0.20105437200822746, "1": 0.13687462748306342, "5": 0.11645193106581164}, "score": 2.897200427948691}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.27331907319246335, "3": 0.2688836018237185, "4": 0.18103056401691195, "1": 0.1706538573529556, "5": 0.10610418396222271}, "score": 2.7786102136011492}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.27553734666333596, "3": 0.2697208617879984, "4": 0.1824650191905388, "1": 0.17472712634960846, "5": 0.09753209262595534}, "score": 2.7525332612015587}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27585729336730613, "2": 0.2670907475134271, "4": 0.18839301366217087, "1": 0.1639217498637806, "5": 0.10472399591712156}, "score": 2.8029041566541144}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28795406733095724, "2": 0.24592602491506257, "4": 0.22551391829840015, "5": 0.1224020696673366, "1": 0.11819323608153628}, "score": 2.9880054324084955}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27954516704425325, "2": 0.27297785617475306, "4": 0.1801082535958373, "1": 0.16701098337758433, "5": 0.1003386915675089}, "score": 2.7737815047367294}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28527507179271316, "2": 0.25621006617264297, "4": 0.21450680846976897, "1": 0.12822742933626777, "5": 0.11576960809194953}, "score": 2.933380365917496}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2847952152419347, "4": 0.2378686377294803, "2": 0.23193908649534226, "5": 0.13861211309185723, "1": 0.10677317013291558}, "score": 3.0696082569499357}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2809063610165496, "4": 0.25849694584924177, "2": 0.20961409115543286, "5": 0.16306028498793557, "1": 0.08791023868643968}, "score": 3.199185353118128}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2990904628539135, "4": 0.27037429559534026, "2": 0.21383146948342552, "5": 0.14523887184338646, "1": 0.07145440678650934}, "score": 3.2041138980820856}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2845069206649549, "3": 0.2834939773373361, "2": 0.19599296759748042, "5": 0.16976246223666716, "1": 0.06623238077850808}, "score": 3.2955774534626334}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.284633212858511, "3": 0.27847435679335764, "2": 0.18969848279327697, "5": 0.17937524977416652, "1": 0.06780648090735707}, "score": 3.3180761536949324}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28170515631210724, "2": 0.2711008193948932, "4": 0.19924819904951777, "1": 0.14885391354425065, "5": 0.09908113688620823}, "score": 2.8285999795353667}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2853335306438282, "2": 0.2727422142629833, "4": 0.1975772958133222, "1": 0.14447290466223883, "5": 0.09985666212640638}, "score": 2.835599737148546}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2737889841873944, "2": 0.2471298677904928, "4": 0.21647257801510872, "1": 0.13898152060183444, "5": 0.12361482472625267}, "score": 2.9386085679829073}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30128907290461265, "2": 0.269118358964409, "4": 0.20845297557314135, "1": 0.12330917001547703, "5": 0.09781685258169011}, "score": 2.888348466634242}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27755121618401263, "2": 0.2638952592038706, "4": 0.20235287494047718, "1": 0.14730009655717793, "5": 0.10888630658180516}, "score": 2.8616280644655627}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31457133758317385, "2": 0.2631893615475597, "4": 0.2223160635364171, "1": 0.10517904400449095, "5": 0.09473253302830564}, "score": 2.9382329598142647}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.32602259180540005, "2": 0.2674882068927906, "4": 0.23091317613527648, "5": 0.09350293993750039, "1": 0.0820651200446252}, "score": 2.986300499909192}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32026861930148637, "2": 0.2599720899694445, "4": 0.23154702368825106, "5": 0.09903366857972695, "1": 0.08916978767180088}, "score": 2.9913026189038665}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3279875593920757, "2": 0.25428537983698407, "4": 0.2401824586751033, "5": 0.09988167935354592, "1": 0.07765553892447648}, "score": 3.030349583792055}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.32260339160551427, "2": 0.2888391558372058, "4": 0.20335478826336104, "1": 0.09662268799186437, "5": 0.08856792564055006}, "score": 2.898404883435166}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "human", "scores": {"2": 0.29096060470378665, "3": 0.2725408957479144, "1": 0.23042749991798353, "4": 0.13375810458684428, "5": 0.07229388005083037}, "score": 2.526521256953937}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.28747585640292944, "1": 0.2530060190060146, "3": 0.2528916861266012, "4": 0.12990341060896834, "5": 0.07669792687372246}, "score": 2.4897985633844986}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.28359784020255724, "3": 0.27586352781258516, "1": 0.2076251476315343, "4": 0.15067572016991426, "5": 0.08222512226102033}, "score": 2.616272978179101}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2854583913747782, "3": 0.2746320986749146, "1": 0.19773878242229892, "4": 0.15525285013182874, "5": 0.08690825126087655}, "score": 2.6481300092860662}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.28539725273552774, "3": 0.25886085526652924, "1": 0.23257528498072133, "4": 0.14051569335065178, "5": 0.08262648567780675}, "score": 2.555209976683603}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2928872372040513, "2": 0.2587088191790338, "4": 0.21429026596558703, "1": 0.12488168623792145, "5": 0.109218316087214}, "score": 2.9242536706293767}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2953176861151939, "2": 0.2485122099611515, "4": 0.22152852871063342, "5": 0.11851031212988977, "1": 0.11611265446090371}, "score": 2.9778112211848518}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2963879917633, "2": 0.26146720877340424, "4": 0.20443136158708497, "1": 0.13371897269071778, "5": 0.1039794807279391}, "score": 2.8834834229504205}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29505839295793723, "2": 0.2533196624092504, "4": 0.22432306762746276, "1": 0.11540137614260426, "5": 0.11188221643729501}, "score": 2.9639645350262156}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2901680909364167, "2": 0.2760803313493136, "4": 0.1880142163740983, "1": 0.15591029019456723, "5": 0.08980898975987019}, "score": 2.7797273013197588}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29059399273412617, "2": 0.25023404977023145, "4": 0.2307159912484211, "5": 0.12414022568630685, "1": 0.1043077098254753}, "score": 3.020147134996163}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2795726476848251, "4": 0.2614047778584971, "2": 0.20307459589031474, "5": 0.17258698650805554, "1": 0.08335467354762877}, "score": 3.236796304089012}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2905443635186228, "4": 0.27373100182109283, "2": 0.21304250056666021, "5": 0.14981895208204166, "1": 0.07285579518142594}, "score": 3.214616400390562}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2823885555096302, "3": 0.27696628361630143, "2": 0.19586804231175353, "5": 0.17761309820309434, "1": 0.06715969420595722}, "score": 3.3074286511756137}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2844998365308283, "4": 0.2347800876978032, "2": 0.23241202794186253, "5": 0.13976694808343365, "1": 0.10853072134967014}, "score": 3.0648411861710008}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3089791438479583, "2": 0.27639294832125, "4": 0.20765531775729168, "1": 0.12025368812360814, "5": 0.08671036952352232}, "score": 2.8641745733154176}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29199847480442903, "2": 0.2454075698982396, "4": 0.23431788561426992, "5": 0.12497598251763292, "1": 0.10328829706804792}, "score": 3.0322860672710776}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29346203521167574, "4": 0.2723476510329005, "2": 0.21210496689113484, "5": 0.1476213838908776, "1": 0.07445726070701605}, "score": 3.2065723150121737}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3059034346110345, "4": 0.2895589140238182, "2": 0.19724633498232574, "5": 0.1475701534000951, "1": 0.05971226713759096}, "score": 3.2680307359264194}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3080269499496266, "4": 0.2742775031214803, "2": 0.20945962059227843, "5": 0.14298896779285877, "1": 0.06523900843973636}, "score": 3.2203195527988093}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2655251807627196, "2": 0.26255386972625816, "4": 0.18942488845990615, "1": 0.171201320860089, "5": 0.11128390948718654}, "score": 2.807034106031394}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2689033923850965, "2": 0.2396237725519564, "4": 0.21426868802227195, "1": 0.1413226224276668, "5": 0.1358645833441604}, "score": 2.9637282228133737}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2609684657082712, "2": 0.2524862215182949, "4": 0.19996900488881053, "1": 0.16221403695754516, "5": 0.12435294821586323}, "score": 2.8717594103371686}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2707218686686508, "2": 0.23838546848265826, "4": 0.21611305617730858, "1": 0.14062557741073342, "5": 0.13413851753456854}, "score": 2.964752921199289}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.273599040550434, "2": 0.2443435138803271, "4": 0.212911370671542, "1": 0.13971940745481512, "5": 0.1294134449592774}, "score": 2.9479552436392016}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2776221118176131, "2": 0.2769282587560273, "1": 0.18244863456749608, "4": 0.16961736040233938, "5": 0.0933699705404907}, "score": 2.7145278729251276}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28922510038052385, "2": 0.27636608423228903, "4": 0.18083025598046173, "1": 0.1622786434493605, "5": 0.09129122570475433}, "score": 2.7624872722133578}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.284983156631081, "2": 0.2527340320327881, "4": 0.1992267610966826, "1": 0.14592708497557622, "5": 0.11711867992088064}, "score": 2.888874775993459}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27904486601492245, "2": 0.2542303075882512, "4": 0.19576010959582052, "1": 0.15749820777303794, "5": 0.11345317298632114}, "score": 2.8534377778742375}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2825452681482932, "2": 0.27634303626197776, "4": 0.1714727529371763, "1": 0.1713236707818999, "5": 0.09829963155548278}, "score": 2.749077713718724}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2659190074062716, "2": 0.2461005221226536, "4": 0.18893130416881454, "1": 0.1758143799260063, "5": 0.1232258781526225}, "score": 2.837652332270063}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.27185367962073037, "3": 0.2595991158434173, "1": 0.18363655854539612, "4": 0.1772795701715492, "5": 0.10761907177298634}, "score": 2.7533879566637065}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2689679100475138, "2": 0.25678711080378913, "1": 0.17935829961397054, "4": 0.17766473783619902, "5": 0.11721012673303502}, "score": 2.7965788778570007}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2725608464716707, "3": 0.2681499875452916, "1": 0.19136784749385913, "4": 0.16654034276872792, "5": 0.10137274610871351}, "score": 2.7139869397503276}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2739038901507446, "3": 0.25900862931994517, "1": 0.18965132961183784, "4": 0.1744229817673576, "5": 0.10300685907588061}, "score": 2.7272284293358386}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "human", "scores": {"2": 0.28711659252105626, "3": 0.27009020045915516, "1": 0.2332946108216892, "4": 0.1335147393660411, "5": 0.07595349757350087}, "score": 2.5317017031595324}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2905208594303674, "3": 0.2705566975193053, "1": 0.2049339596076481, "4": 0.14937399266266566, "5": 0.08459671863013726}, "score": 2.6181718653704413}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2973394688908542, "3": 0.2850810366521058, "1": 0.19425271752491205, "4": 0.14834079253433752, "5": 0.07496884138262644}, "score": 2.6124269271878475}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.28316030300292433, "3": 0.2783309237562607, "1": 0.18711933698004132, "4": 0.16070321503471457, "5": 0.09066968603972629}, "score": 2.684638395588269}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.309121894280176, "3": 0.26109039255240113, "1": 0.2356246043340872, "4": 0.12517987200171052, "5": 0.06896757585324326}, "score": 2.482735819896704}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2651996872419824, "2": 0.25062860424431777, "4": 0.19369773538308982, "1": 0.17048409006743645, "5": 0.11997684657796892}, "score": 2.8420525850806997}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27606061991736175, "2": 0.25004681966358716, "4": 0.20219574826312595, "1": 0.1474796616246644, "5": 0.12420383901708935}, "score": 2.905596026724561}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2790671625904534, "2": 0.27891282532973066, "4": 0.18298181548729864, "1": 0.16814654300536025, "5": 0.09087727582279495}, "score": 2.749526854548573}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28034452100877166, "2": 0.26171734328868657, "4": 0.2029644375032577, "1": 0.14618282713828976, "5": 0.10878000924492133}, "score": 2.8664400077237637}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2763821968446779, "2": 0.252026408834306, "4": 0.20102841756419665, "1": 0.1530598435115914, "5": 0.1174914398960813}, "score": 2.877863773317328}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30717176276992336, "2": 0.2564265526038831, "4": 0.22360843830920696, "1": 0.10961555383327024, "5": 0.103171853555443}, "score": 2.954294218276888}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3357641164283293, "2": 0.27649509438597797, "4": 0.21624462261490413, "1": 0.0913592904164362, "5": 0.08013110285217698}, "score": 2.9172926756060322}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.33403616948410497, "2": 0.27338013949426654, "4": 0.21753857235850135, "1": 0.09430947662116074, "5": 0.08073089009959387}, "score": 2.9170008654139963}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3244490065080297, "4": 0.2585924005415012, "2": 0.22861824932264851, "5": 0.11583178148348751, "1": 0.07250379309053025}, "score": 3.1166306842227756}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3187126391146209, "4": 0.24740351781148548, "2": 0.24620407839384487, "5": 0.10461485711598092, "1": 0.08306062633950927}, "score": 3.0443080906634696}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28767140646476924, "4": 0.24201547707865523, "2": 0.22977286533995644, "5": 0.13483093752157307, "1": 0.1057019117186861}, "score": 3.070501185185529}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27810403741341777, "4": 0.2348553702610692, "2": 0.22832448088187351, "5": 0.1468891438745202, "1": 0.11181729883978397}, "score": 3.076675320801592}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2900501905832346, "4": 0.24279524597320412, "2": 0.22900656676714048, "5": 0.13921353522460064, "1": 0.09892299102287547}, "score": 3.094370850083644}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2992864013510943, "4": 0.2555556205691822, "2": 0.22693721174589132, "5": 0.13693604321547115, "1": 0.0812728716625512}, "score": 3.1399464104978305}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2991524707337577, "4": 0.2411477169152623, "2": 0.23699645399626837, "5": 0.1263650675227881, "1": 0.09632693504130059}, "score": 3.064228257244611}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27592855650942144, "2": 0.2507915156355345, "4": 0.2051313240134151, "1": 0.14876232215060708, "5": 0.11937141643792505}, "score": 2.8955564443726276}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28024711821243714, "4": 0.24784988958670467, "2": 0.22300247699116665, "5": 0.1442954565266237, "1": 0.10459353878051286}, "score": 3.104252449065814}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.28307582057391356, "3": 0.2786446123450262, "4": 0.17908482548473892, "1": 0.16280562083438013, "5": 0.09637820424239736}, "score": 2.7631515861665212}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2862069581388532, "2": 0.24494310987326265, "4": 0.21945170356358262, "1": 0.12717082723711612, "5": 0.12221201679110458}, "score": 2.964590428043417}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28878693843842557, "2": 0.2576836523716893, "4": 0.22185392703648538, "1": 0.12049732806882076, "5": 0.11116730057355355}, "score": 2.9455096282624114}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2932241926279393, "4": 0.25091847334553624, "2": 0.2170843264012594, "5": 0.14545831911115228, "1": 0.09329773947370576}, "score": 3.1381576478587254}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2936495880133351, "4": 0.24663666924899255, "2": 0.2241629581230718, "5": 0.13840764484565443, "1": 0.0971266968171583}, "score": 3.1050373343067372}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29703936704209266, "4": 0.238346662487283, "2": 0.23350714564672326, "5": 0.1333623792355842, "1": 0.09772961930636746}, "score": 3.076106165070455}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30407244501374664, "4": 0.24180472501195444, "2": 0.23412882053393425, "5": 0.12511401968032845, "1": 0.09486817335050894}, "score": 3.068168402643422}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2944948097454879, "4": 0.2403812198011874, "2": 0.23404728766551558, "5": 0.13020930301918113, "1": 0.10085485247232263}, "score": 3.0650436480504406}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3280914495022658, "3": 0.25732602970593543, "1": 0.22280037228329402, "4": 0.12878447606777557, "5": 0.0629814840347014}, "score": 2.4810468490440076}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.30164392908195886, "3": 0.28351745161048114, "1": 0.17280703701066677, "4": 0.15934281955101293, "5": 0.08267857330016681}, "score": 2.677438676326957}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2907708729890646, "3": 0.2809579963508463, "4": 0.17047173041894925, "1": 0.1619266700890004, "5": 0.0958595384592386}, "score": 2.747563264102464}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.3088382505935984, "3": 0.27079632742014376, "1": 0.19291100700871236, "4": 0.1480923667833301, "5": 0.07934905034565395}, "score": 2.6121251613252006}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.3151211849541045, "3": 0.278238839289805, "1": 0.1808270733959633, "4": 0.1496400852203322, "5": 0.0761625200617782}, "score": 2.62518593410818}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28967421037570723, "2": 0.2671374123430719, "4": 0.1927064177032276, "1": 0.14580242896185752, "5": 0.10465502646964185}, "score": 2.843270359849662}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2890343904073764, "2": 0.25401549751151653, "4": 0.21246957018522342, "1": 0.13136793875528066, "5": 0.11308802287599776}, "score": 2.921892321007724}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28594608497692225, "2": 0.27297187802516376, "4": 0.1801541510259378, "1": 0.15908346140252988, "5": 0.10181455588186758}, "score": 2.7926382683366704}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29082516497905125, "2": 0.2416471680455851, "4": 0.22460798167965296, "5": 0.13166249326144452, "1": 0.11122804786146777}, "score": 3.0238303989512865}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28856875573198465, "2": 0.26355442126779155, "4": 0.19663595577903858, "1": 0.14025063597619317, "5": 0.1109653820206892}, "score": 2.874507908219102}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28424191216547623, "2": 0.265015384490471, "4": 0.20394488361510435, "1": 0.13413252167684314, "5": 0.11265140949732036}, "score": 2.895965829881317}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27548841557577775, "2": 0.2499262511598952, "4": 0.21964857415990843, "5": 0.127749201552006, "1": 0.12717375219977956}, "score": 2.970872819593469}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2931880696326297, "4": 0.2507588647058204, "2": 0.22649380169918604, "5": 0.1383217065483417, "1": 0.09122351273989804}, "score": 3.1184631143993586}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27944910387974065, "4": 0.24367753636751624, "2": 0.22286211882104145, "5": 0.15305217540551913, "1": 0.10094100921023295}, "score": 3.125040007698932}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29410930353661596, "4": 0.242509377317918, "2": 0.23626488719774297, "5": 0.13264461430688088, "1": 0.09445787604488728}, "score": 3.08261911848653}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "human", "scores": {"2": 0.28502023535167714, "1": 0.24785241766847166, "3": 0.23156913748493024, "4": 0.14306072335637846, "5": 0.09248575928421543}, "score": 2.547301862511077}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2705723090911416, "1": 0.23153076965771127, "3": 0.2291369085823608, "4": 0.1533018538841093, "5": 0.11543438565631652}, "score": 2.6505284687586075}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.259258459950977, "3": 0.23705782032173608, "1": 0.2109574340958565, "4": 0.17394571694870933, "5": 0.11876715302172983}, "score": 2.7303030766869854}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2705515840460446, "3": 0.23191345864224946, "1": 0.22588277702588455, "4": 0.1622460611691263, "5": 0.10938238681396809}, "score": 2.6586855965225005}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2872984810480228, "3": 0.24319120334517177, "1": 0.22576826090767046, "4": 0.15244896418929216, "5": 0.0912779711810837}, "score": 2.5961637979557923}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2581108590781099, "2": 0.2437390483401798, "4": 0.19031648158429118, "1": 0.172385160576431, "5": 0.1354275050387331}, "score": 2.8726594549723243}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2741578071169212, "2": 0.24714061817356087, "4": 0.20365518191730964, "1": 0.1441715166992036, "5": 0.13085843355505117}, "score": 2.929887244623802}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2754334611187597, "2": 0.24218666673946937, "4": 0.2110843209456866, "1": 0.13919870977256857, "5": 0.13208411823542618}, "score": 2.954667894363026}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27638855370830895, "4": 0.2303352321821138, "2": 0.22773513816720703, "5": 0.1498042555637184, "1": 0.11572443203059307}, "score": 3.070760617688318}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2735765516336079, "2": 0.2407117787484712, "4": 0.2097076208617472, "1": 0.1400050759842144, "5": 0.13598724287982894}, "score": 2.9609597179662077}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28002595043007855, "2": 0.2506490814377665, "4": 0.2035890047375607, "1": 0.1499211034890255, "5": 0.11580390412885866}, "score": 2.8847042614250933}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2965161183394987, "2": 0.23794360194722114, "4": 0.23354037607783784, "5": 0.12839962606459837, "1": 0.103589842430627}, "score": 3.045216813242346}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3021468867151856, "2": 0.26725163800084323, "4": 0.2017475128074532, "1": 0.13209313988878763, "5": 0.09674783737841032}, "score": 2.86380350124581}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.292095113087664, "2": 0.23569509019387833, "4": 0.2319232687890332, "5": 0.13166614036302, "1": 0.10860845717225998}, "score": 3.042344050157883}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2779185204938561, "4": 0.23719454727552627, "2": 0.2276075283882457, "5": 0.14511557283586482, "1": 0.11215329927901428}, "score": 3.075512361276593}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3161115883627266, "2": 0.26969440346925877, "4": 0.21409263152984928, "1": 0.1151979645169667, "5": 0.08489581331617713}, "score": 2.883793042625}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3254935282563965, "2": 0.289960259963598, "4": 0.1952289903291651, "1": 0.11796849284005338, "5": 0.07133851607575985}, "score": 2.8120068569504224}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3278550463953796, "2": 0.27143716577570953, "4": 0.21793873234116126, "1": 0.09949815278149723, "5": 0.0832633085862831}, "score": 2.914031225317835}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.34308978576233834, "4": 0.27009003840508344, "2": 0.2238249736920402, "5": 0.10396524691135439, "1": 0.05902389010495858}, "score": 3.136148604084031}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3153918326502885, "4": 0.2588771640141312, "2": 0.22937609186734995, "5": 0.1171685948240098, "1": 0.0791777780269202}, "score": 3.1054836064251075}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27032641654740514, "2": 0.252220039460934, "4": 0.20396201570486572, "1": 0.14781901871872316, "5": 0.12565833275510235}, "score": 2.9074192918173054}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.29494419795789145, "3": 0.2940393138514772, "4": 0.1763451191051647, "1": 0.15570387700040686, "5": 0.07895851429131939}, "score": 2.7279077529410256}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2941533644103628, "2": 0.2674738431617501, "4": 0.19690149513374308, "1": 0.13795133513054514, "5": 0.10350598933292836}, "score": 2.8605350116560926}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2912762935190676, "2": 0.26989415914601356, "4": 0.18989606173586165, "1": 0.15086996079344142, "5": 0.09805132626658537}, "score": 2.8143623690282493}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2769999924641593, "2": 0.2638498203526331, "4": 0.18835791931286577, "1": 0.1673386626432553, "5": 0.10343610499033196}, "score": 2.7966994258462057}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29908717287691694, "2": 0.2618809939436597, "4": 0.22025813049509232, "1": 0.11589708267567901, "5": 0.102868294824471}, "score": 2.9323189973922044}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31902194036141496, "2": 0.2564582232387511, "4": 0.23401391490182907, "5": 0.09688379580730855, "1": 0.0936148925233034}, "score": 2.984093383175866}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3204796497362637, "4": 0.2475572773775649, "2": 0.2465028065415771, "5": 0.10331321321006666, "1": 0.08213989079114155}, "score": 3.043401426529758}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3042127459905638, "4": 0.2672962460216614, "2": 0.22277490765607322, "5": 0.12755463453619112, "1": 0.0781548315476067}, "score": 3.14332189517574}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3128635894159761, "4": 0.24859875697962144, "2": 0.24325069518906592, "5": 0.10963729275293803, "1": 0.08564184258674427}, "score": 3.0533393794009434}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2629655615645108, "2": 0.2572603427558474, "4": 0.19492355946795126, "1": 0.16215676929229678, "5": 0.12268212725726604}, "score": 2.858712288100813}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2613375793288508, "2": 0.2545689388767363, "4": 0.19545822602705534, "1": 0.16509224511418708, "5": 0.1235316846436368}, "score": 2.8577665552718674}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2637864776153663, "2": 0.26349987114872125, "4": 0.18904900723398085, "1": 0.16543521681196022, "5": 0.11821970250990102}, "score": 2.8311164651427956}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27237434241055786, "2": 0.2554536231254953, "4": 0.20659465373565217, "1": 0.1410194718375481, "5": 0.12454969326784786}, "score": 2.918200801439387}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2704860102899322, "2": 0.23368374379452103, "4": 0.22784201656574665, "5": 0.1449810695372666, "1": 0.1229997200043142}, "score": 3.03812125545196}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "human", "scores": {"2": 0.30131977582542885, "3": 0.2874127911185493, "1": 0.17775206374258967, "4": 0.16206441489048018, "5": 0.07144016734224452}, "score": 2.6481170504745846}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.30659669258395955, "3": 0.30399613240768086, "4": 0.1720314104407337, "1": 0.1424358294994107, "5": 0.07493209316925721}, "score": 2.730425131217585}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.3128705976388708, "3": 0.30215166067370985, "4": 0.15911071473364932, "1": 0.15817812619355584, "5": 0.0676796591430029}, "score": 2.66524008927072}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3053898261342146, "2": 0.28837449894547557, "4": 0.19219667159493062, "1": 0.12827329166469395, "5": 0.08575669673074979}, "score": 2.8187873491622155}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.29796891797913877, "3": 0.29382027737792143, "4": 0.18090283772473958, "1": 0.14695295168456793, "5": 0.08034806252762816}, "score": 2.7497224013251587}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30491632020558473, "2": 0.25319609789197606, "4": 0.20319052363902596, "1": 0.12996852152020089, "5": 0.10870321592130663}, "score": 2.9074614713976596}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2961045433561228, "2": 0.23394149880213647, "4": 0.20851047483258783, "1": 0.1318022217599556, "5": 0.12961609667983295}, "score": 2.9701959758647742}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2983862770942715, "2": 0.2693007484300624, "4": 0.1956364869849014, "1": 0.1415052868074485, "5": 0.09515612645280841}, "score": 2.8336349100198435}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29728089878482755, "2": 0.22752574094062766, "4": 0.2257460915529825, "5": 0.13315984903330627, "1": 0.11626997747869154}, "score": 3.032000651883661}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30259569634080113, "2": 0.27097562684186066, "4": 0.20019703948451353, "1": 0.13666972912107028, "5": 0.08955141046618126}, "score": 2.834983043026846}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3014482256846063, "2": 0.2754971211472572, "4": 0.19499189215014776, "1": 0.13426682870056184, "5": 0.09378449829565517}, "score": 2.8385282639217313}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3051310263603435, "2": 0.24448341614388022, "4": 0.22932377714751562, "5": 0.11729075985971214, "1": 0.10375620649728451}, "score": 3.011909644157855}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3138759923187584, "2": 0.258737511578045, "4": 0.21834058911050191, "1": 0.10581789859504638, "5": 0.10321611345428977}, "score": 2.9543989648292133}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29522874982261404, "4": 0.24324305723715342, "2": 0.22850220929672052, "5": 0.13276479167769742, "1": 0.10024899878774439}, "score": 3.079773406411688}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30623766361745425, "2": 0.2768595613772921, "4": 0.1946542638404815, "1": 0.13465571732328493, "5": 0.08758271656431658}, "score": 2.8236469237864235}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2754766800192433, "2": 0.26965222656287624, "4": 0.1808026633887674, "1": 0.16848933920573, "5": 0.1055647046339865}, "score": 2.785298078939904}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27891954720981943, "2": 0.26781000137192545, "4": 0.19341614879340335, "1": 0.15393385220188968, "5": 0.10590853867730547}, "score": 2.829553490056835}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28734146411584083, "2": 0.26476993496952683, "4": 0.18933517913957268, "1": 0.15426140199472257, "5": 0.10427719385428463}, "score": 2.824594227336155}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2878131770890598, "2": 0.2600849943606787, "4": 0.1981386779028282, "1": 0.14450833376189212, "5": 0.10944030918024496}, "score": 2.86791571813902}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2866495469866512, "2": 0.256012706748003, "4": 0.1977113381839729, "1": 0.1500223343954679, "5": 0.10958713420492534}, "score": 2.860825873517417}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.274535829538085, "2": 0.2686292776237865, "4": 0.18144325840911044, "1": 0.16922181666865546, "5": 0.10615534912168156}, "score": 2.786677959211845}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2906159043472358, "2": 0.27034287992747774, "4": 0.19233723795930702, "1": 0.1398438690172776, "5": 0.10684862134652859}, "score": 2.8560022085297883}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28338099915601683, "2": 0.2742843052879042, "4": 0.17785323344691054, "1": 0.16888822050872393, "5": 0.09557311713366942}, "score": 2.7569338298318318}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29400797093122794, "2": 0.2651261310514567, "4": 0.19312284306267588, "1": 0.1435325844816952, "5": 0.10419706677615691}, "score": 2.8493236569801272}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2902165530540773, "2": 0.27638780746022135, "4": 0.1890587056968154, "1": 0.1502124129886413, "5": 0.09411230272213919}, "score": 2.8004682398089598}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2882484203461816, "2": 0.2377501848641624, "4": 0.2211915966242973, "5": 0.12675994221766088, "1": 0.12603380681037116}, "score": 2.9848934401274607}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2979060531699158, "2": 0.24323707353154528, "4": 0.22462224473933695, "5": 0.1185496996504846, "1": 0.11566002616831679}, "score": 2.9871641985254955}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28977170214956965, "2": 0.23998875761695815, "4": 0.2274765324449529, "5": 0.1256206534714001, "1": 0.11713152854480209}, "score": 3.0044660730298802}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2836212379895194, "4": 0.2498741469685791, "2": 0.23198213838488757, "5": 0.1304259038579917, "1": 0.1040889663346784}, "score": 3.0705664203912795}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2856433712292168, "4": 0.2360598746477387, "2": 0.2351606456204574, "5": 0.12618829282708027, "1": 0.11693748537671263}, "score": 3.0194010443466013}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.29400361964545774, "3": 0.2518221234580822, "1": 0.22156016524332794, "4": 0.1506178718009667, "5": 0.08197751308473125}, "score": 2.577441043126182}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.3187302962839269, "3": 0.2567810250213799, "1": 0.2113073225931738, "4": 0.142847393054908, "5": 0.07031754064356627}, "score": 2.5421300135463065}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.33089830052002167, "1": 0.2641998644374064, "3": 0.23243224866788229, "4": 0.11467451131340278, "5": 0.057771170962913586}, "score": 2.3709037858666067}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.32309211844374036, "3": 0.24549470505112805, "1": 0.2324731835910869, "4": 0.1319078112515307, "5": 0.06701422960345135}, "score": 2.4778884118544515}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.3260848028506615, "1": 0.24896810079030682, "3": 0.23295296796947523, "4": 0.12573270679198248, "5": 0.06624195204903824}, "score": 2.4341845902882024}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2702433309778648, "2": 0.25236770706073797, "4": 0.203872516418228, "1": 0.14784914730473667, "5": 0.1256530049547437}, "score": 2.907111196971491}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29854828513048154, "2": 0.2792053629513282, "4": 0.1950476483020756, "1": 0.13861056064488433, "5": 0.08857802295960934}, "score": 2.8157753456245542}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2829273013581273, "2": 0.27892370314203446, "4": 0.18058646237007517, "1": 0.1671573156663823, "5": 0.09039452297311805}, "score": 2.7481344802681638}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2864317760943624, "2": 0.2823403558971587, "4": 0.1811958297976224, "1": 0.16505497149359044, "5": 0.08496770804730114}, "score": 2.7386785013862247}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2834454756672499, "2": 0.2795560974739732, "4": 0.18234517904472924, "1": 0.1593616231131083, "5": 0.0952743170924188}, "score": 2.7746105685773332}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3110536729066506, "2": 0.24336867605331192, "4": 0.21500611702072878, "5": 0.1211125621635517, "1": 0.10941232887062258}, "score": 2.995037676095675}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30413089335438387, "2": 0.26897519917664336, "4": 0.1898590545998919, "1": 0.13751410298108452, "5": 0.09947139137796916}, "score": 2.844790771320748}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3169767029743562, "2": 0.2569488091792641, "4": 0.20343584129522796, "1": 0.11500254734938459, "5": 0.1075993362450264}, "score": 2.9316780981921267}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3132527206525815, "2": 0.25394796376973705, "4": 0.21625043967349153, "5": 0.11714464801067549, "1": 0.09937956201422046}, "score": 2.9978325944357005}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30827630623347163, "2": 0.26047851427006785, "4": 0.1968457798946984, "1": 0.12589193484395617, "5": 0.10846209737303686}, "score": 2.901503122137035}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "human", "scores": {"2": 0.29359127499583004, "3": 0.28687775348746625, "1": 0.1959671374265967, "4": 0.1513923905212241, "5": 0.07215692628238148}, "score": 2.6101750340362475}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2841259367075233, "2": 0.2756638749015238, "1": 0.17707585126221062, "4": 0.1742401254175592, "5": 0.08888373602939871}, "score": 2.72218910979193}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2904570390084806, "2": 0.280459962610094, "1": 0.1726513044009078, "4": 0.16978504214567533, "5": 0.08663572669910218}, "score": 2.717290835495973}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2843187531389243, "2": 0.27395390956772, "1": 0.17966131209430344, "4": 0.17285935361848903, "5": 0.08919837116901044}, "score": 2.717977221295053}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29643627729990835, "2": 0.2708856507775389, "4": 0.18568774617709516, "1": 0.15886957442759006, "5": 0.0881124446549827}, "score": 2.7732859526171785}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "human", "scores": {"2": 0.29339551490865445, "3": 0.2620036877338653, "1": 0.20270728223456008, "4": 0.15638629227695663, "5": 0.08549295535010348}, "score": 2.628556824035414}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.30495943842164785, "3": 0.26217989203756864, "1": 0.20977893357531455, "4": 0.14212963717543595, "5": 0.08093361728559097}, "score": 2.5794717941804373}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2729369125671742, "3": 0.257240585920196, "1": 0.18950012402014538, "4": 0.17305003615028441, "5": 0.10726123193401303}, "score": 2.7356324024432928}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.26923757788467545, "3": 0.25931565867602957, "1": 0.18668725413380877, "4": 0.17855151856379453, "5": 0.10619362502385679}, "score": 2.7483230669394096}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.29117573317765755, "3": 0.26934130817684826, "1": 0.1888388449266696, "4": 0.16202599397268944, "5": 0.08860646992969833}, "score": 2.6703816708080605}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2854311028569747, "2": 0.23721860002207365, "4": 0.2315701332343623, "5": 0.12456177517405785, "1": 0.12120656986610638}, "score": 3.0010619563792913}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.299750654976801, "4": 0.27053729929952763, "2": 0.2153265426599092, "5": 0.13888321206351933, "1": 0.07549363733401826}, "score": 3.1819914809921532}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30801157978831284, "4": 0.2554255758574993, "2": 0.22924779183923, "5": 0.12302995705147211, "1": 0.08427572627345056}, "score": 3.103687217039553}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3122166003965565, "4": 0.2642565942380272, "2": 0.22742353658715042, "5": 0.12168066084965877, "1": 0.07441268904539199}, "score": 3.1313703043061163}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.305632952084837, "2": 0.2584184264048003, "4": 0.23749566697254432, "5": 0.10438440417391735, "1": 0.09405914428977247}, "score": 2.999727757775303}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2579818617052365, "2": 0.24376130273119073, "4": 0.19017999750309614, "1": 0.17261543118720926, "5": 0.13544038480688556}, "score": 2.87206591257238}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.26936269472575225, "2": 0.2560158557236622, "4": 0.19391995658154712, "1": 0.15982057487929874, "5": 0.12086483788679378}, "score": 2.8599903754896987}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2754792144163577, "2": 0.24202230201133995, "4": 0.21122932232940705, "1": 0.13907347338499385, "5": 0.13218291446099706}, "score": 2.955425333100161}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2690765681284043, "2": 0.2602652436759251, "4": 0.19436905144797917, "1": 0.16002671643000518, "5": 0.1162480510286683}, "score": 2.8465442719196723}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2704020103809973, "2": 0.24947164937660485, "4": 0.2041202700073317, "1": 0.14857418250239654, "5": 0.12741884842067916}, "score": 2.9123368093996}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3029037138642033, "2": 0.25502864673401476, "4": 0.22202157880707024, "1": 0.11368774132514392, "5": 0.106344622796616}, "score": 2.952306041776991}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2977287624722756, "2": 0.2510233038841864, "4": 0.23285528797963445, "5": 0.1107454228033891, "1": 0.1076356140955628}, "score": 2.988051462803341}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30855344782332045, "2": 0.2520194782033597, "4": 0.22434150774150005, "1": 0.10834922540859376, "5": 0.10672274239931326}, "score": 2.969068642901873}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2869755093898518, "4": 0.26303580904713836, "2": 0.2112024767886093, "5": 0.15160004635532512, "1": 0.08717340352831893}, "score": 3.18068892258001}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3005769754218103, "4": 0.2401931950709627, "2": 0.23820038637522867, "5": 0.12163810439805088, "1": 0.09938063531928606}, "score": 3.046508244650291}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2873883908083911, "3": 0.2571498731636769, "1": 0.1955442465696388, "4": 0.1698444773109735, "5": 0.09006482411282907}, "score": 2.6714945517750226}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2786971418051993, "3": 0.26604274170688386, "4": 0.1895813801393175, "1": 0.16417229883536624, "5": 0.10149727785728335}, "score": 2.785532231926984}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2871284506811967, "3": 0.2670324746701181, "4": 0.1887093647732293, "1": 0.16248351963276259, "5": 0.09463779106306738}, "score": 2.765887490599624}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.29461858246737066, "3": 0.26142467151903626, "1": 0.18365022161361172, "4": 0.17135756195570714, "5": 0.08894103116740684}, "score": 2.6873181186293538}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2929883007333431, "3": 0.2574058903626933, "1": 0.185492709424649, "4": 0.17199764398914982, "5": 0.09210850451252178}, "score": 2.6922387941902914}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3142659742085701, "2": 0.2632344497468868, "4": 0.22098766356395771, "5": 0.10277547751412877, "1": 0.09872271669578984}, "score": 2.9658582670882163}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3032237491349266, "4": 0.2648510199370895, "2": 0.222262113974841, "5": 0.1351607321820914, "1": 0.07449066972725218}, "score": 3.163930951330202}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3232997395013723, "4": 0.2586079682725978, "2": 0.22898245364523806, "5": 0.1241861039751898, "1": 0.06491264733931917}, "score": 3.148174070744479}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31123264244601156, "4": 0.30107186156105914, "2": 0.18957929475560562, "5": 0.15931234018507712, "1": 0.038792137292078054}, "score": 3.3525371056519284}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3143000424866416, "4": 0.2679326060654972, "2": 0.23053882328287234, "5": 0.12203929450511203, "1": 0.06518005250725113}, "score": 3.15111365417587}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28184249287149443, "2": 0.2518140400976578, "4": 0.21191161534303768, "1": 0.13461469397644088, "5": 0.1198073791046838}, "score": 2.930482265715284}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27471016020937666, "2": 0.2500587221754807, "4": 0.21200199372312117, "1": 0.1386458137927041, "5": 0.12457155365720944}, "score": 2.9337939729293265}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2831043277443573, "2": 0.24456890248830646, "4": 0.22197012016938927, "5": 0.1252908179865848, "1": 0.12505683062494485}, "score": 2.977868993203471}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29613554712483114, "2": 0.26713842746716754, "4": 0.2090639694343095, "1": 0.11943136787566751, "5": 0.10822125392724848}, "score": 2.919504554662526}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.279572172411728, "2": 0.246822308507667, "4": 0.21493678872777772, "1": 0.14108836256934085, "5": 0.11757163165983157}, "score": 2.9210803289490865}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30246836061189536, "4": 0.2936543158097608, "2": 0.20148007215094532, "5": 0.1501757355958814, "1": 0.05221568762650608}, "score": 3.288096018680226}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29755047634558046, "4": 0.28883453444768364, "2": 0.1986503767840891, "5": 0.1487598378405712, "1": 0.06619585045184977}, "score": 3.2553144109000884}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31260420793528365, "4": 0.27971252490357296, "2": 0.22106707869755063, "5": 0.12027187185590794, "1": 0.06633789343747735}, "score": 3.1665144725936836}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3202721743028908, "3": 0.2766780563989284, "5": 0.19103580648455654, "2": 0.16359680243873562, "1": 0.0484093258969216}, "score": 3.4419317953443382}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31262918600935846, "4": 0.2865614731141058, "2": 0.2158200112326866, "5": 0.12187682200393447, "1": 0.06310656964732178}, "score": 3.1882830846182073}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.282558011227241, "2": 0.2543649073087313, "4": 0.21889349317454168, "1": 0.12950224008998384, "5": 0.1146698326887858}, "score": 2.9348630209778337}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29189927057844306, "4": 0.2721610206929747, "2": 0.21135728154915073, "5": 0.14591700176238342, "1": 0.07865597365327796}, "score": 3.1953276415527605}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.302353958471605, "4": 0.24118820901614912, "2": 0.24091052017884299, "5": 0.1214358183262579, "1": 0.09410090641234004}, "score": 3.054948094433301}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29164443705751786, "4": 0.2458104176795385, "2": 0.23144356844216135, "5": 0.13459181142353696, "1": 0.09650157012926297}, "score": 3.0905480738916564}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2926675955965689, "2": 0.2608824907639703, "4": 0.22030022584591263, "1": 0.1168540451829987, "5": 0.10928682837301427}, "score": 2.9442828103574294}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27850969743155074, "2": 0.25682093189335187, "4": 0.20051388154374, "1": 0.15224119600126143, "5": 0.11189990641406954}, "score": 2.8630083996167515}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2682946934944923, "3": 0.2593832970194689, "1": 0.19235366426082184, "4": 0.17150893750538374, "5": 0.10844366038367192}, "score": 2.735390069355062}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2733408029225275, "3": 0.2629816029530236, "1": 0.1914978878358633, "4": 0.17184758993858942, "5": 0.10030972796835005}, "score": 2.7161241117593096}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2591034438282729, "3": 0.2581130014071309, "4": 0.18886722953811222, "1": 0.17457470850364376, "5": 0.11932674407770612}, "score": 2.819265168852957}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.259416500206446, "3": 0.25204392527840935, "1": 0.20269611337101398, "4": 0.17167096988661848, "5": 0.11415223804756239}, "score": 2.7351613552005936}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "human", "scores": {"3": 0.34831581373980813, "4": 0.2797814265833503, "2": 0.21586169010082082, "5": 0.10971455943967712, "1": 0.04631839947328252}, "score": 3.190713603229096}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3184053889693959, "2": 0.26599299636551904, "4": 0.22436569305959983, "1": 0.10089622152946694, "5": 0.09033262392772487}, "score": 2.937245057427316}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.35844250800130967, "2": 0.2910822807672219, "4": 0.20876046182082839, "1": 0.07256729069985031, "5": 0.06914099178505917}, "score": 2.910825006535964}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3293912911871195, "4": 0.299395780584517, "2": 0.20238436349756408, "5": 0.12712905848126255, "1": 0.04169178800109921}, "score": 3.2678880256736154}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.32803315283150186, "2": 0.2744518069809718, "4": 0.22838595410605164, "5": 0.08670056313529091, "1": 0.0824185702785509}, "score": 2.9624977595912254}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "human", "scores": {"2": 0.27410536574459693, "3": 0.27274575993481553, "4": 0.18667741597475368, "1": 0.16620669742334385, "5": 0.10025700900275133}, "score": 2.7806709731679593}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2678500687450955, "2": 0.24855664791692741, "4": 0.20533370377896876, "1": 0.1470743408453922, "5": 0.13117739651166438}, "score": 2.9249825788928194}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28459649754224103, "2": 0.2691413426536542, "4": 0.19528065475490827, "1": 0.1459076633731023, "5": 0.10506187675148373}, "score": 2.84444587766467}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2709223040856295, "2": 0.2372813526404474, "4": 0.22681351929967217, "5": 0.13997156278071432, "1": 0.12500343025704527}, "score": 3.0194685841638087}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.26961876479790525, "2": 0.24340749645298695, "4": 0.216759659315156, "5": 0.13632921771127066, "1": 0.13387279780304215}, "score": 2.9782647404662015}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2815522600901802, "4": 0.23432456376917316, "2": 0.23243938444745005, "5": 0.13297328973358913, "1": 0.1186962345831301}, "score": 3.030439723917642}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28414898025539354, "4": 0.2560993304982771, "2": 0.21738102274206772, "5": 0.15037309095446982, "1": 0.09198876766358213}, "score": 3.1554883238614484}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29959842031495076, "4": 0.2578314505476467, "2": 0.22376231147252656, "5": 0.13188876513874842, "1": 0.08690752123463207}, "score": 3.1240330571446893}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2901275572854543, "4": 0.27638421444207906, "2": 0.20142483388867338, "5": 0.1594179833469432, "1": 0.07263772964969661}, "score": 3.248521796940037}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2845339216529027, "4": 0.26613398340551037, "2": 0.21007965723956054, "5": 0.15459399279804706, "1": 0.08464866003521891}, "score": 3.1959469090063948}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27897954925741314, "2": 0.2537363102081779, "4": 0.2011297010842368, "1": 0.15542275860530722, "5": 0.11071964426969821}, "score": 2.8579854528360693}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27891620019533503, "2": 0.24303201386954357, "4": 0.21890211774807572, "1": 0.13749694229188175, "5": 0.12164417429090292}, "score": 2.9441640903899726}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2786046854329087, "2": 0.2545346762034931, "4": 0.20181026604155844, "1": 0.15259610266587859, "5": 0.11244395041759603}, "score": 2.866969912572291}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2939652840729896, "2": 0.25706312543163684, "4": 0.21431572516143002, "1": 0.12605675965638452, "5": 0.10859271008766123}, "score": 2.9223240038085296}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2836659685856651, "2": 0.2523001320374866, "4": 0.2101827476054013, "1": 0.14382347492126538, "5": 0.11001930814523679}, "score": 2.8902733637460143}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "human", "scores": {"3": 0.25471986660982393, "2": 0.22390157970457883, "4": 0.22059518483165189, "5": 0.15199259141720634, "1": 0.1487769908387256}, "score": 3.0031248493650766}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.26851054286840065, "2": 0.24267021434666325, "4": 0.21100169760860996, "1": 0.15428676465396393, "5": 0.12352232129681615}, "score": 2.906801808163126}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2649897587418157, "2": 0.2533913873578659, "4": 0.20570614688572866, "1": 0.15676125497082813, "5": 0.11914151389557767}, "score": 2.877074055721112}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.24779811915238018, "4": 0.23360407122283258, "2": 0.20847121600651133, "5": 0.17421677880501127, "1": 0.1358977247574691}, "score": 3.1017721937429066}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.25775238576696763, "2": 0.24103973103809845, "4": 0.21284425029845214, "1": 0.15446179419322434, "5": 0.13389451373196004}, "score": 2.9306694504935398}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "human", "scores": {"3": 0.276428356525777, "2": 0.2561244550749393, "4": 0.19910465260563712, "1": 0.15493247533234608, "5": 0.11339253712945133}, "score": 2.859897866068722}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2812333576540178, "2": 0.23938814660792615, "4": 0.21626998959688123, "5": 0.13160619325369152, "1": 0.13148325156507662}, "score": 2.977127290382093}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2817034097455524, "4": 0.23511354766015785, "2": 0.23308641834409866, "5": 0.13694447873554458, "1": 0.11313516778824968}, "score": 3.04964659409694}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2844156370413543, "4": 0.24623372314946199, "2": 0.2196142677320264, "5": 0.1501944336388921, "1": 0.09952880293243486}, "score": 3.1279523975498145}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27981995513842095, "2": 0.24003392775151797, "4": 0.22325110714984456, "5": 0.131668800045918, "1": 0.12520936785402914}, "score": 2.9961359787040243}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29039593327602164, "4": 0.24055204729047408, "2": 0.23290037312748882, "5": 0.13559486132869364, "1": 0.10054955383685739}, "score": 3.077742851316136}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2919455402796067, "2": 0.23502057863789425, "4": 0.2350084753897557, "5": 0.1256195354525594, "1": 0.11238705693240049}, "score": 3.0264533514672225}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29720542874595296, "4": 0.238448052881978, "2": 0.23791290920229455, "5": 0.12174251467722892, "1": 0.10468053400755975}, "score": 3.034659471039845}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3079478279898354, "2": 0.2550251783680041, "4": 0.22617435383485532, "1": 0.1090117068747052, "5": 0.1018287294545041}, "score": 2.9567826932249925}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2980562058579007, "2": 0.247900257801506, "4": 0.22480062066524956, "5": 0.11661924117806814, "1": 0.11260389189219706}, "score": 2.984930763326728}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2843989992132486, "3": 0.28328698893765464, "4": 0.17456566576795216, "1": 0.17365937731707448, "5": 0.0840761956689912}, "score": 2.7109966117907813}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3130262268810804, "2": 0.27104581861865545, "4": 0.20895520084865657, "1": 0.11225042120317483, "5": 0.09471167522106169}, "score": 2.9028308547120996}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3187258978361875, "2": 0.27316878903413944, "4": 0.20306919417790714, "1": 0.12067005211697729, "5": 0.0843589727858791}, "score": 2.8572772339992887}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3296146942076104, "2": 0.29456045995502417, "4": 0.19261492315256096, "1": 0.11067697007281216, "5": 0.07252325572036382}, "score": 2.82174530597619}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3156014801707589, "2": 0.2776707832397402, "4": 0.20304212685840015, "1": 0.12155388701479114, "5": 0.08212317702404903}, "score": 2.846508611947009}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3232047356694298, "2": 0.250434442323491, "4": 0.23947769451917314, "5": 0.09663009923625095, "1": 0.09024076625206394}, "score": 3.00182194050469}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3224598327872957, "4": 0.24899852655119947, "2": 0.23114101503847806, "5": 0.11597475973998247, "1": 0.08141685203042978}, "score": 3.0869741109036437}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3129259180507137, "4": 0.24510825717770696, "2": 0.2317011463487358, "5": 0.11614233664860592, "1": 0.09410912178006539}, "score": 3.057474300375968}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3130174622694328, "4": 0.2762690967590208, "2": 0.20816806931600615, "5": 0.13562687905499723, "1": 0.06690891915712961}, "score": 3.205538914953922}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3126719253402526, "2": 0.25562360740610207, "4": 0.22874345208528138, "1": 0.1030042839365931, "5": 0.09994701334229485}, "score": 2.9670049828486533}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30241525183085927, "2": 0.2832358319270696, "4": 0.1874264644683915, "1": 0.14093340572434546, "5": 0.08597996284925387}, "score": 2.7942818782122787}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29160670070895706, "2": 0.24319013330623113, "4": 0.22273942243975614, "5": 0.12185990667499129, "1": 0.12059030350932956}, "score": 2.982088253058716}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3093052579254317, "2": 0.25862801116679107, "4": 0.2204908679821063, "1": 0.10944567188678, "5": 0.1021197126969003}, "score": 2.947210385287919}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.298921972854611, "2": 0.2524613780964139, "4": 0.22031710148954134, "1": 0.11538985965994726, "5": 0.11289779935506196}, "score": 2.962871161375509}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3075920152230968, "2": 0.2887604001382366, "4": 0.18664977109660158, "1": 0.13553869601309368, "5": 0.0814500117234319}, "score": 2.789710087519991}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2964310304242352, "2": 0.24619142382944056, "4": 0.22775456480302694, "1": 0.11533742688498257, "5": 0.11426755577067438}, "score": 2.9794230283947165}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3030061429245177, "2": 0.24560473587902729, "4": 0.2388779086604421, "5": 0.11435087575435471, "1": 0.09814941681991886}, "score": 3.0256763710352756}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3040935179643554, "2": 0.2644122343366631, "4": 0.2183970811278322, "1": 0.10693473327711385, "5": 0.10615074207950322}, "score": 2.952416308084797}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3159075725846589, "4": 0.2685781623360286, "2": 0.2279493098420012, "5": 0.12053120462886835, "1": 0.06702329724212863}, "score": 3.147646210667432}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31394699909878493, "2": 0.2598158936850578, "4": 0.2242762562881821, "1": 0.10145777265719967, "5": 0.10049076964794573}, "score": 2.962525895329996}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27651237586941785, "2": 0.24010023427887286, "4": 0.21622472902474274, "1": 0.13459801624906373, "5": 0.1325539826898856}, "score": 2.972036129479857}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2792697551321579, "2": 0.26119380482212995, "4": 0.1983237267167464, "1": 0.15141352637418906, "5": 0.10978243888424492}, "score": 2.8538652994404563}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2735560068060482, "2": 0.2507042052314136, "4": 0.20270839712767835, "1": 0.14805478570988043, "5": 0.12496317313591689}, "score": 2.9058197017196017}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28668179687470935, "2": 0.25823824239886006, "4": 0.20162275038902505, "1": 0.14010797550905182, "5": 0.11333721507101227}, "score": 2.889841663037606}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2815531047482274, "2": 0.25231711240775573, "4": 0.20936783455695185, "1": 0.14031112509094198, "5": 0.11643745699036259}, "score": 2.909302173662229}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2617674669591146, "2": 0.2391612424321169, "4": 0.2086100832199574, "1": 0.15285167075826434, "5": 0.13759674627771593}, "score": 2.938938210824916}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2672261166880763, "2": 0.23725143334833046, "4": 0.21624992067305912, "5": 0.14210989673983726, "1": 0.13715172283405844}, "score": 2.9889147141989594}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26254867121110304, "2": 0.22832082771940476, "4": 0.21905612575805658, "5": 0.14800524006502952, "1": 0.14205481141185203}, "score": 3.0026361931054004}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26376118170512125, "4": 0.2335324124867936, "2": 0.2260173528805924, "5": 0.14965699550537523, "1": 0.12702265787142766}, "score": 3.052784231022151}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.26769979345770545, "2": 0.24896932073698955, "4": 0.20882069790270072, "1": 0.14939093263391182, "5": 0.12510632540471955}, "score": 2.9112810155829263}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.28311372696406456, "3": 0.2747923657866524, "1": 0.17762109097234943, "4": 0.17325187819820626, "5": 0.09120960221490969}, "score": 2.7173119692062424}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2898659802177754, "3": 0.2864037071557056, "4": 0.18480612063569393, "1": 0.14940387044887724, "5": 0.08951413797281199}, "score": 2.7751592851476836}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.29402208365253524, "3": 0.29009767568598266, "4": 0.17743126224978678, "1": 0.151789892584838, "5": 0.0866492515916303}, "score": 2.7531254687886246}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.280402221848408, "2": 0.2800831375677644, "4": 0.18595209355051145, "1": 0.15660169057274823, "5": 0.09694675196701179}, "score": 2.7865560682527146}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29196612316573456, "2": 0.28298111924876473, "4": 0.1860751601615504, "1": 0.14768237888221097, "5": 0.09128502724096917}, "score": 2.7902972004859996}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.31946786156658025, "3": 0.3085482024592932, "1": 0.1831154959146156, "4": 0.13109736337117026, "5": 0.05773900138074758}, "score": 2.5608624272641327}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.31381061875845107, "3": 0.298634816961369, "1": 0.19637167783564893, "4": 0.13252751430249887, "5": 0.058602694630543684}, "score": 2.54315486366892}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.304455787322999, "2": 0.29916279167203325, "1": 0.1697291581088181, "4": 0.15317907762951266, "5": 0.07345225321336732}, "score": 2.6614553897327613}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.29906034596071507, "3": 0.28931957672545544, "1": 0.20328704173511006, "4": 0.139575835747693, "5": 0.06871299787851733}, "score": 2.57134845483855}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30318557566798066, "2": 0.27385730306137424, "4": 0.18072883865707576, "1": 0.14631847460724995, "5": 0.09588481995274872}, "score": 2.805999378588779}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2796194520634647, "2": 0.25351917950906583, "4": 0.19737504073945378, "1": 0.15037485032992634, "5": 0.11910066727401636}, "score": 2.881306212028741}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28528442896852474, "2": 0.2396875449223701, "4": 0.21483321415908724, "1": 0.13569766762762053, "5": 0.12448732194869096}, "score": 2.952724513521363}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2837617503837175, "2": 0.24199086535616365, "4": 0.2126554560911164, "1": 0.14089379491155693, "5": 0.12068630746777077}, "score": 2.930248790984253}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29573899124346237, "2": 0.25872566167137956, "4": 0.19950790886588085, "1": 0.13794148575684365, "5": 0.10807634537227771}, "score": 2.8810508236699084}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28253433385799576, "2": 0.25827649031474753, "4": 0.19592953494099843, "1": 0.15554800207239836, "5": 0.10770263812440191}, "score": 2.8419608942693446}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3393769644079402, "2": 0.2639171370276819, "4": 0.23350656187958882, "1": 0.08285774146048393, "5": 0.08033129563666458}, "score": 2.9645361679414215}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3230054444561973, "4": 0.2523050771685367, "2": 0.24180042092615572, "5": 0.10627178041972403, "1": 0.07660559983592406}, "score": 3.069837832919866}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32592965601310303, "4": 0.263744064159899, "2": 0.22744705339663163, "5": 0.11242791705347253, "1": 0.07044045753423095}, "score": 3.1202732349879736}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.33636536969976694, "4": 0.24806285930362318, "2": 0.2447826757116444, "5": 0.09809837277099734, "1": 0.07268087474207277}, "score": 3.054115712569021}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3215306517614591, "2": 0.24905034853646535, "4": 0.24332935085282348, "5": 0.10622935456868732, "1": 0.07984776457633233}, "score": 3.047042771733084}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.258588909567658, "2": 0.2521385351159919, "4": 0.18951634592504912, "1": 0.17812243999863267, "5": 0.12161616286320341}, "score": 2.8243621641654673}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28207959389890563, "2": 0.2437343198485085, "4": 0.21881566848641845, "1": 0.13121899945989707, "5": 0.12413948084718726}, "score": 2.960921844918613}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2739269264365686, "3": 0.2707810278598612, "4": 0.18110715614358386, "1": 0.17292443012582137, "5": 0.10124797228609779}, "score": 2.7638243648674425}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2799642955042503, "2": 0.25291315754220206, "4": 0.2052662216818269, "1": 0.1456152514114937, "5": 0.1162277558907758}, "score": 2.893576655755341}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2689126697121667, "2": 0.25457179006481834, "4": 0.20219920583998346, "1": 0.15714464374959722, "5": 0.1171590342567486}, "score": 2.867654521775243}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30934117035055275, "4": 0.25556998319864427, "2": 0.2353653244045082, "5": 0.12099725737071611, "1": 0.07870994229203558}, "score": 3.1047809992271547}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3095555252124898, "4": 0.27895209902034, "2": 0.21126166401434854, "5": 0.1408428569254598, "1": 0.059378278577763}, "score": 3.2306218001933065}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.31589354659981533, "3": 0.29662890486430155, "2": 0.17507899620961273, "5": 0.17214223435052622, "1": 0.04024755589769165}, "score": 3.404607452497951}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.32791183580723643, "3": 0.2594669097295627, "5": 0.23043376763122178, "2": 0.14467617643276237, "1": 0.037501362999986104}, "score": 3.5691061297628224}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3007320830900132, "4": 0.2512485476809214, "2": 0.23734708867914983, "5": 0.12235001090058487, "1": 0.08830526913937409}, "score": 3.081992336435725}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27689223273310676, "2": 0.26135299870089823, "4": 0.20085082713752264, "1": 0.1545060692877581, "5": 0.10638439248555968}, "score": 2.8432523619281205}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28047064833823127, "2": 0.25999525451462596, "4": 0.20793609127051255, "1": 0.14405070836064457, "5": 0.10753645205589699}, "score": 2.8749109674982822}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.270706140184998, "2": 0.26823647986241145, "4": 0.19143506768507362, "1": 0.16716893350353626, "5": 0.10244279845837272}, "score": 2.793744135482256}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27667116720109486, "2": 0.2615126818747815, "4": 0.20188601964867905, "1": 0.14861091458020892, "5": 0.1113048662203575}, "score": 2.865759314636612}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.28353111748099363, "3": 0.2638242545437244, "1": 0.19155862144490085, "4": 0.17341101378759427, "5": 0.08766329467460574}, "score": 2.682085523780792}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2770506326911575, "2": 0.2581977021772941, "4": 0.2112628470829796, "1": 0.14730419155678245, "5": 0.1061729086685608}, "score": 2.8708010651989633}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2844382205394885, "2": 0.24166171564297972, "4": 0.23951414579815092, "5": 0.12216371592816162, "1": 0.11221176881443586}, "score": 3.017756509641203}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2844837911925307, "2": 0.2639096682783873, "4": 0.21032365929707988, "1": 0.1400256162354519, "5": 0.10124657507372102}, "score": 2.868854506760029}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2900957030284951, "4": 0.24310862963432545, "2": 0.23720042977324135, "5": 0.12157163517787967, "1": 0.10801508345384674}, "score": 3.0330215846177913}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2899908233856622, "2": 0.24842343240958642, "4": 0.2301554566263363, "1": 0.11816333697520406, "5": 0.11325941312177965}, "score": 2.9719239648873077}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2784596815814499, "2": 0.25069703519367603, "4": 0.19986814596964572, "1": 0.15220951790459386, "5": 0.11874568186151488}, "score": 2.8822410908728426}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2849924187341798, "2": 0.2503214217268939, "4": 0.19031356976439842, "1": 0.16264105873488113, "5": 0.11170494539318256}, "score": 2.838115617553148}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28235554621692194, "2": 0.25656642013443437, "4": 0.2023465616292672, "1": 0.14680858259017146, "5": 0.11190697871163716}, "score": 2.8759749604103884}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2774022666727906, "2": 0.24531798794864976, "4": 0.20517032318486386, "1": 0.14780541999455193, "5": 0.12428768005244197}, "score": 2.9128154323126907}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27906314405224564, "2": 0.24321107287814445, "4": 0.2067707060317323, "1": 0.14351930833166207, "5": 0.12742032648789361}, "score": 2.9313606095215974}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29059317907208565, "2": 0.250542803700116, "4": 0.21460945307757343, "1": 0.13276060965262682, "5": 0.11148518130595131}, "score": 2.921515104121074}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2845787961906116, "4": 0.23923383888514954, "2": 0.23026252682645815, "5": 0.1359867261292878, "1": 0.10992961298017401}, "score": 3.0610860575266083}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3001705997865443, "2": 0.2414962823509316, "4": 0.23076285442503816, "5": 0.11787043102116315, "1": 0.10969269550679409}, "score": 3.005622083227144}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30141778095129707, "4": 0.26144461898245924, "2": 0.21706830616912481, "5": 0.13761641025771693, "1": 0.0824437694869878}, "score": 3.1547230045238384}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2972381825889044, "2": 0.2425649425810194, "4": 0.22784782661124686, "5": 0.12136085485579493, "1": 0.11097873195912897}, "score": 3.006047187038438}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2926487484102985, "2": 0.26328454802937395, "4": 0.21422200396156502, "1": 0.12787413744899465, "5": 0.10196103994369517}, "score": 2.8991103002290806}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30349728929656966, "4": 0.264866567148266, "2": 0.2342991877930509, "5": 0.1247109773622706, "1": 0.07262016796995996}, "score": 3.1347497810939915}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3054492607771835, "2": 0.25390583729703525, "4": 0.24043218602201374, "5": 0.10562729138017314, "1": 0.09457972966865313}, "score": 3.008621521246331}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2978560985136142, "4": 0.24656897677450088, "2": 0.2422670860616957, "5": 0.12172917242878886, "1": 0.09157282698008563}, "score": 3.0646149589125495}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29726814570782517, "2": 0.25422957032142823, "4": 0.24164180353800072, "5": 0.10946986205318195, "1": 0.0973841999173688}, "score": 3.0115836318373015}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30690869071974197, "4": 0.25427080970215776, "2": 0.2236207147494553, "5": 0.12807580036326704, "1": 0.08710984243133545}, "score": 3.112583602977711}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30925444324609475, "4": 0.26694458204737614, "2": 0.21764869649453408, "5": 0.12756600016045933, "1": 0.07857569902976447}, "score": 3.1472780458718854}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3176656069311778, "4": 0.2484020192326339, "2": 0.23222078508681968, "5": 0.11427489198324474, "1": 0.087425961333444}, "score": 3.069879845635794}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3048868667116795, "4": 0.2953797093414889, "2": 0.18058368135996847, "5": 0.1669533745264173, "1": 0.05218198283976707}, "score": 3.3443437648158674}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3027462751531045, "4": 0.2596766956490771, "2": 0.21815272240082784, "5": 0.13295230820395537, "1": 0.08646059655380767}, "score": 3.1345089302246443}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3092630406391202, "2": 0.28786870160608774, "4": 0.18538615592956442, "1": 0.1366417420265226, "5": 0.08083134948722191}, "score": 2.7858947400897933}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3058832456505932, "2": 0.24466060855907817, "4": 0.2247702746298632, "5": 0.11341246194856905, "1": 0.11126618337232777}, "score": 2.984402110515421}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31823136431721943, "2": 0.24444549970653204, "4": 0.22840171328057018, "5": 0.10651366416967359, "1": 0.10240056999856355}, "score": 2.9921823457188363}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.32123279520145703, "2": 0.27082002313546544, "4": 0.21004930292224167, "1": 0.11103053782129192, "5": 0.08686062121412398}, "score": 2.8908887133767363}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30963608204013887, "2": 0.28382986137680183, "4": 0.18627405047349557, "1": 0.1380124335079234, "5": 0.0822362234018357}, "score": 2.7908893956464884}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2798166532824313, "3": 0.27389624833881315, "1": 0.18967788265665328, "4": 0.1662469243113774, "5": 0.09034500937946867}, "score": 2.6877591283180724}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28153663437336285, "2": 0.27331431748196466, "4": 0.18013361462331803, "1": 0.169852697982614, "5": 0.09514687772681257}, "score": 2.757403809584989}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28107152631288024, "2": 0.27211331504756925, "4": 0.17840420294589113, "1": 0.17612774911489004, "5": 0.09226775947093269}, "score": 2.7385668702246595}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27977082306822065, "2": 0.24734936710844724, "4": 0.20288353171166648, "1": 0.1499237121389214, "5": 0.12005808639793263}, "score": 2.895801404369881}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2799267828020599, "2": 0.269561584722053, "4": 0.18422869233507505, "1": 0.16801013063468498, "5": 0.09825941557500105}, "score": 2.7751626660378883}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27587596953824833, "4": 0.23235074897008176, "2": 0.23014408722760543, "5": 0.1408915688071836, "1": 0.12072167373676423}, "score": 3.042547130583234}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.264411123807611, "4": 0.24790043133174722, "2": 0.2161500362847785, "5": 0.1660941139127708, "1": 0.10543315803355004}, "score": 3.153074011533969}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26999630642087996, "4": 0.2551032790342222, "2": 0.2117261679152618, "5": 0.1620579648551241, "1": 0.10109519310810007}, "score": 3.1653061406990655}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27952864641307046, "4": 0.25234867925298293, "2": 0.21831170456131768, "5": 0.1501838753413358, "1": 0.09961046994366307}, "score": 3.135186032885542}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2803856786053494, "4": 0.2540898079119049, "2": 0.21871348355481712, "5": 0.14847382483693533, "1": 0.09832293132907556}, "score": 3.1356800480375098}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28420570205249956, "2": 0.25877272814980407, "4": 0.20785280875495124, "1": 0.1385300790053923, "5": 0.11062775190345613}, "score": 2.8932742598746453}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28706913607069623, "2": 0.259418575546749, "4": 0.21751394838585356, "1": 0.12525178344959692, "5": 0.11073857894773716}, "score": 2.929068397971481}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2975116187908233, "2": 0.26568496877088005, "4": 0.21101925368017344, "1": 0.12316205136090977, "5": 0.10261332308974286}, "score": 2.9042359871464263}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2804373584480676, "2": 0.2414047001806925, "4": 0.22481186097728825, "5": 0.1281643313252428, "1": 0.1251679554451331}, "score": 2.989399766341182}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28268321215617287, "2": 0.25133205144669807, "4": 0.21114406626207777, "1": 0.13992337886698564, "5": 0.11490612365841744}, "score": 2.9097764968173783}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2783517993583677, "3": 0.2638600843102775, "1": 0.19266969136014503, "4": 0.16993249653407916, "5": 0.09517613989054066}, "score": 2.6965906242996933}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.26511971507671894, "3": 0.2649210558050946, "1": 0.1819159885226542, "4": 0.1811131327783505, "5": 0.10692331325743978}, "score": 2.766006477288233}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2905525860404585, "3": 0.2739304327236671, "1": 0.1794705592187939, "4": 0.16868672204944157, "5": 0.08735126155293085}, "score": 2.693892957619088}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2673558864667931, "2": 0.23355873307281805, "4": 0.21758859022562013, "5": 0.14089444302450416, "1": 0.14059243586802198}, "score": 2.984633719165298}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2667359129844526, "2": 0.25432802707105334, "4": 0.19944206217375868, "1": 0.1595400964418241, "5": 0.11993983942944578}, "score": 2.865911635540848}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2570775984930115, "3": 0.24755893601687973, "1": 0.1922416701026208, "4": 0.18147000511658382, "5": 0.12163929645731505}, "score": 2.783184950486149}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.26053001596311365, "3": 0.25109513192593913, "4": 0.19507251846267318, "1": 0.17385984375751587, "5": 0.11943344599954817}, "score": 2.82568813052604}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.25444674966304937, "2": 0.25089305659156663, "4": 0.2017113225500187, "1": 0.16398857798767152, "5": 0.12895027681143142}, "score": 2.8807404690552523}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2621933684303597, "2": 0.258603985740552, "4": 0.20581363585053486, "1": 0.15077361583834148, "5": 0.12260706876562578}, "score": 2.89087564746344}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.248367617935315, "2": 0.23225817564307769, "4": 0.21835829725033415, "5": 0.15661780571581807, "1": 0.1443885282400878}, "score": 3.010558777661287}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.25216864225444513, "3": 0.24519420719883175, "1": 0.18723111802258288, "4": 0.18713400771114566, "5": 0.1282616962832466}, "score": 2.817024632111498}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.24557123767768266, "3": 0.2434887350884658, "4": 0.19151426160524193, "1": 0.17935629081226417, "5": 0.14005844208693696}, "score": 2.867345862939706}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.27384191271341507, "3": 0.24408555009417468, "1": 0.20043685890744675, "4": 0.17053411743811864, "5": 0.11109002170571126}, "score": 2.717995276228925}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.26734997796699134, "3": 0.24894009345441004, "1": 0.18552589703890862, "4": 0.18105406330919244, "5": 0.11712002679344422}, "score": 2.776890126818512}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.27232940435155195, "3": 0.24898288993472695, "1": 0.18530491898179807, "4": 0.17914830439468915, "5": 0.11422446217660048}, "score": 2.7646556282443333}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "human", "scores": {"3": 0.263813200539042, "2": 0.25269491183261106, "4": 0.19610765702691227, "1": 0.16530181403780148, "5": 0.12206784283469377}, "score": 2.8569427179100333}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2983673301672473, "2": 0.24170821583024402, "4": 0.2332537178607849, "5": 0.12484149329252311, "1": 0.10181883218301632}, "score": 3.037591215599152}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2942030511095354, "4": 0.2470708849309356, "2": 0.22175231902760134, "5": 0.14306759043590817, "1": 0.09389405563907019}, "score": 3.123667131727946}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29369707499093556, "2": 0.2398485251750546, "4": 0.23376793184039266, "5": 0.12813507474816654, "1": 0.10454151643660062}, "score": 3.0411069292937536}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28413034069367304, "2": 0.26010231659812727, "4": 0.20841847946031608, "1": 0.13133612529327993, "5": 0.11599815420827489}, "score": 2.9176390195605326}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28916598881141425, "2": 0.261542836025355, "4": 0.20049092401864663, "1": 0.1471053620949523, "5": 0.1016817948814651}, "score": 2.8480989645486146}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2881506630625728, "2": 0.25898032122382614, "4": 0.20170755058355502, "1": 0.14895579424130964, "5": 0.10219467564261835}, "score": 2.849203334115891}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2979544370416146, "2": 0.25486512380740817, "4": 0.21122330237950537, "1": 0.13547974950212366, "5": 0.10046880476654968}, "score": 2.886335313573461}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30201913581162626, "2": 0.25617612058781974, "4": 0.2115692523101719, "1": 0.13197459988836402, "5": 0.09824819499044994}, "score": 2.8879388991526667}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.299898738391483, "2": 0.257183253383543, "4": 0.2076090157842937, "1": 0.13719343701529207, "5": 0.09810609341673783}, "score": 2.8722498664307734}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2886369237224113, "2": 0.2480557896128766, "4": 0.2231992296209453, "1": 0.12346726731842558, "5": 0.1166256554127228}, "score": 2.9614596329147}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31034593013479617, "4": 0.24353105710830117, "2": 0.23882667484405767, "5": 0.11615906234930483, "1": 0.09112664834344143}, "score": 3.0547697923266077}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3046299858493767, "2": 0.26352466765325355, "4": 0.216160498199711, "1": 0.11585985092461643, "5": 0.09981458141245356}, "score": 2.920544463916399}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29868128815425327, "2": 0.2597176758649045, "4": 0.21865122468901915, "1": 0.11833452592336453, "5": 0.10460528529447234}, "score": 2.9314743823050833}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3080371766141266, "2": 0.2704171262758629, "4": 0.21288654665299012, "1": 0.11774462437429066, "5": 0.09090169782775799}, "score": 2.888782140553003}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28486499861778347, "2": 0.27030833231506246, "4": 0.18717710963611772, "1": 0.15503239250403236, "5": 0.102605493991875}, "score": 2.812012785934186}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.291604921913508, "2": 0.2760617793744003, "4": 0.19204003750914075, "1": 0.14331350582282235, "5": 0.09696744261149477}, "score": 2.8232839558483196}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.30159383018616676, "3": 0.28848519832002195, "4": 0.1652317409251991, "1": 0.16466165271913266, "5": 0.0800135406904705}, "score": 2.694337396047133}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2792780495670571, "2": 0.27416378382226225, "4": 0.18268262890565992, "1": 0.16949605953720043, "5": 0.09436755140855424}, "score": 2.7582589456387447}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28094625255204597, "2": 0.2646751907652879, "4": 0.1910384236930332, "1": 0.15286119371398957, "5": 0.11046824222616568}, "score": 2.84157563527883}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2734412194398054, "4": 0.2552800247652626, "2": 0.21579674708943558, "5": 0.15449414187961297, "1": 0.1009774958837063}, "score": 3.1465180891982714}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.2962765411991901, "3": 0.2735384177203057, "5": 0.18864119639509577, "2": 0.1800486836389619, "1": 0.061487209586656835}, "score": 3.3705387775012956}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28695912355608566, "4": 0.26555330136832217, "2": 0.20999024536214206, "5": 0.1513452391357863, "1": 0.08614020668078864}, "score": 3.185975331027831}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.30601869014186883, "3": 0.2754405949377853, "5": 0.1925289012808042, "2": 0.17132303688549072, "1": 0.05467870230187003}, "score": 3.410400185771293}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2788064961423803, "4": 0.2746075751234958, "2": 0.19307535999384937, "5": 0.17633947615164108, "1": 0.07715905795503678}, "score": 3.2798964199737135}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31050244600710575, "2": 0.29247277311800446, "4": 0.18651860241871301, "1": 0.1320615998130171, "5": 0.07843233503370443}, "score": 2.786784689217088}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3087097079878761, "2": 0.2874002314540081, "4": 0.19407344676390356, "1": 0.1277443854978907, "5": 0.08206370853669945}, "score": 2.8153102878755605}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.34000569891421684, "2": 0.3277264213130657, "4": 0.16802217739292258, "1": 0.11197471411573533, "5": 0.05226163152464125}, "score": 2.720866979122729}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3188046966172607, "2": 0.2915845686002974, "4": 0.19938724308609593, "1": 0.10429181454174925, "5": 0.08592237556803832}, "score": 2.871062597215964}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31643440818403734, "2": 0.2818476224515437, "4": 0.20354151296288636, "1": 0.11363915020281987, "5": 0.08452501947356376}, "score": 2.8634639514719296}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29849687954193027, "2": 0.26152269800230493, "4": 0.2133053439795231, "1": 0.12065770820204774, "5": 0.10600809710547165}, "score": 2.9224827049531097}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3089570526289437, "2": 0.25644919606817224, "4": 0.22518060722281735, "1": 0.1063718611422355, "5": 0.10303093459196112}, "score": 2.9620491653257335}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3039660382802564, "2": 0.25426539379159074, "4": 0.2232371097442495, "1": 0.11055697279396885, "5": 0.10796359413808428}, "score": 2.9637845642094574}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31689940178376413, "4": 0.24826891142640412, "2": 0.2435956013901745, "5": 0.10990672801715881, "1": 0.0813221054201071}, "score": 3.0618430037134705}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3176664010961879, "2": 0.24697355817690242, "4": 0.2402701653006358, "5": 0.10785854272126442, "1": 0.08722348159250495}, "score": 3.0345670007706644}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2662114396640204, "2": 0.2525087442937552, "4": 0.202197992648388, "1": 0.15816006328295637, "5": 0.12091123471455648}, "score": 2.8751902775460394}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2593030821715665, "3": 0.2588228055175301, "4": 0.18768928927824627, "1": 0.17958420004630676, "5": 0.11459131075022828}, "score": 2.798398551154228}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2691388396508064, "2": 0.2519390968113265, "4": 0.20734145575732454, "1": 0.14771323295375502, "5": 0.12385905662046205}, "score": 2.9076932384527243}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.25547390694842853, "2": 0.2505966260746668, "4": 0.20426318379115446, "1": 0.16493629014146047, "5": 0.12472147846865492}, "score": 2.8732358550279766}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2648258338027132, "3": 0.2590471467668263, "1": 0.186958707877452, "4": 0.18097863379784165, "5": 0.10818152237796529}, "score": 2.758596460259231}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2958987334252412, "2": 0.23673725062565068, "4": 0.22998203081553137, "5": 0.12619581387345774, "1": 0.11117512702700184}, "score": 3.0232864110633444}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3073788048483208, "2": 0.24082301328345201, "4": 0.2372993392486614, "5": 0.11465616485934808, "1": 0.09983203052629261}, "score": 3.026124872788952}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2934403198245493, "2": 0.24781610994888864, "4": 0.21605177520462937, "1": 0.12867227642214352, "5": 0.11400906684753223}, "score": 2.9389086075944197}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3097513810150548, "2": 0.24770114994665543, "4": 0.23389289080923073, "5": 0.10903557214929908, "1": 0.0996086172061526}, "score": 3.0050457031680406}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31005034235313583, "2": 0.2674004316679907, "4": 0.20955419200817652, "1": 0.12057879974311313, "5": 0.09240547951337456}, "score": 2.88580589175571}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "human", "scores": {"2": 0.27757974991564505, "3": 0.26853454878398153, "1": 0.1959326894319046, "4": 0.16602382115286374, "5": 0.09190662159866254}, "score": 2.680384722136152}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29128395418632447, "2": 0.2607364635415273, "4": 0.19687204087330468, "1": 0.14982434566140046, "5": 0.10126473021219128}, "score": 2.8390133737307464}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27990595702414794, "2": 0.25732052298782176, "4": 0.1939595396840036, "1": 0.16052231689553126, "5": 0.10827952511051941}, "score": 2.8321513957297846}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28759771449077787, "2": 0.24511298781272095, "4": 0.2105474785470859, "1": 0.13675756763713218, "5": 0.1199691083209261}, "score": 2.931856540192501}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2779297486288908, "2": 0.2661581228525126, "4": 0.18237752994893217, "1": 0.1729138128917641, "5": 0.100598442856491}, "score": 2.7715835635582264}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2834787257716262, "2": 0.253503563208595, "4": 0.2047838594913363, "1": 0.14986337998744548, "5": 0.10836005003689325}, "score": 2.868272263580492}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2881781539471233, "2": 0.2681268471998867, "4": 0.20021802123367596, "1": 0.14455422244230404, "5": 0.09891416748561183}, "score": 2.8408096970432095}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2868160814004534, "2": 0.25684294239035144, "4": 0.20670529412905259, "1": 0.14208556960797727, "5": 0.1075402266516079}, "score": 2.8807704871443938}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28217204652936245, "2": 0.24888443667217378, "4": 0.21254418134853872, "1": 0.13953936934635497, "5": 0.11684975671823425}, "score": 2.918279685105939}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28875892746395126, "2": 0.26605019100794136, "4": 0.20845030739213044, "1": 0.1340731945733762, "5": 0.10265994064713609}, "score": 2.8795727126832986}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29210188977289686, "2": 0.24515105681570987, "4": 0.22680855213799014, "5": 0.12021932453033377, "1": 0.11570467955596712}, "score": 2.9906866502536396}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2800488854945968, "4": 0.2766225880095122, "2": 0.19593603990954037, "5": 0.17364468635518993, "1": 0.07373490372274208}, "score": 3.2805097309609748}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2929764056498051, "2": 0.24215927697638143, "4": 0.22564967341905082, "5": 0.12663644949593617, "1": 0.11256814583150872}, "score": 3.011627120608126}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3110213250067882, "2": 0.24351330434133417, "4": 0.2431220739132751, "5": 0.11281237934201209, "1": 0.08952067274340023}, "score": 3.0461926559969053}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2931941973273192, "4": 0.2703268220373341, "2": 0.207771429530135, "5": 0.15355384372634223, "1": 0.07514197161202696}, "score": 3.2193817113484435}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "human", "scores": {"2": 0.27409314091790044, "3": 0.262770040503116, "1": 0.1870433071318042, "4": 0.17559366056479936, "5": 0.10048746355600979}, "score": 2.7283854679174544}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2844627970634336, "3": 0.27113050655995957, "1": 0.18528255402782912, "4": 0.169413992469711, "5": 0.08969442172304812}, "score": 2.6937701143652966}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2800389439356255, "3": 0.2656108530042232, "1": 0.19008907516955276, "4": 0.17217360152308753, "5": 0.09207758887703668}, "score": 2.696108665085184}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2749098371456308, "3": 0.26836695498502333, "1": 0.18280243490528597, "4": 0.1794155240383578, "5": 0.0944916035266326}, "score": 2.727880310953669}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.26710981847362475, "2": 0.25866861895217197, "4": 0.18855924959949272, "1": 0.17407044593614676, "5": 0.11158049726460338}, "score": 2.8049085151581497}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2989797899548945, "2": 0.2573437086114396, "4": 0.22442107334629322, "1": 0.11298491101799872, "5": 0.10626266269212015}, "score": 2.9536325038952898}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30247552919698917, "4": 0.24659331433354734, "2": 0.2386383865068743, "5": 0.11845020709547725, "1": 0.09383434862210815}, "score": 3.057187114522381}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3063454782493096, "2": 0.24034007005887587, "4": 0.2379358689058204, "5": 0.11304309062433655, "1": 0.10232811651942962}, "score": 3.0190258873848963}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3051158617251777, "4": 0.2786544208080087, "2": 0.21443682631637453, "5": 0.13223775530712065, "1": 0.0695467076235424}, "score": 3.189601287860115}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29178580220172395, "2": 0.24859037934267522, "4": 0.23697867992875454, "5": 0.1138542337586002, "1": 0.10878354465267187}, "score": 2.998529667976123}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27460106700108694, "2": 0.26496773900779685, "4": 0.20585233245144127, "1": 0.14547530963505173, "5": 0.10909362723434422}, "score": 2.8681199197759164}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2856977914747998, "2": 0.2527046660444629, "4": 0.2239868576620229, "1": 0.12162703583417792, "5": 0.11597545559062851}, "score": 2.9599787032202123}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2940792471017045, "2": 0.2586414343088981, "4": 0.21549753672803942, "1": 0.12465691440418265, "5": 0.10711330280979282}, "score": 2.921767974504572}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2824779456326898, "2": 0.2511821514644159, "4": 0.22505861490856618, "1": 0.12419839900807744, "5": 0.11707105743844502}, "score": 2.9596213025623963}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28512916239279096, "2": 0.25549455007408106, "4": 0.22538372160849549, "1": 0.12343509594067502, "5": 0.11054967627455226}, "score": 2.9441178966732946}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2678901956908267, "2": 0.25972980496357967, "4": 0.19825266022896645, "1": 0.15622261027054096, "5": 0.11788971620116294}, "score": 2.8618549932046955}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27956344989602067, "2": 0.24534082811652108, "4": 0.21747023247582414, "5": 0.1314136890362169, "1": 0.1262007987065555}, "score": 2.9825549930926925}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29979562094741097, "2": 0.24680794386732693, "4": 0.23021182860013054, "5": 0.11967017045767595, "1": 0.10350369152547091}, "score": 3.015737011685141}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2967092725199368, "2": 0.2392334321879691, "4": 0.2292603549624492, "5": 0.13104635020515226, "1": 0.1037340361649404}, "score": 3.044652290027107}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28109884779304023, "2": 0.25388577952818103, "4": 0.21341191661314032, "1": 0.12969788430672413, "5": 0.12189172845077621}, "score": 2.9439130489441174}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3210920297183294, "4": 0.2819997202685534, "2": 0.20312528963576518, "5": 0.13528456907688283, "1": 0.05848904542333567}, "score": 3.232467650553982}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.32214407358901304, "4": 0.28727440644405094, "2": 0.19667048808472112, "5": 0.14142453863745894, "1": 0.05247936679831401}, "score": 3.2684961754612343}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.33174519157398513, "4": 0.30653396931746585, "2": 0.1791297635046919, "5": 0.1423884916976636, "1": 0.040194785729154074}, "score": 3.3317942051397456}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3188361004264897, "4": 0.29736994774843023, "2": 0.19041623355337478, "5": 0.1475081279462696, "1": 0.045863797436406735}, "score": 3.310244172424844}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.32086599630670676, "4": 0.2973281404728972, "2": 0.19017461548532272, "5": 0.15101750828220362, "1": 0.0406071467313408}, "score": 3.3279764103464418}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2904317993884681, "2": 0.23829649579505904, "4": 0.2303814651025311, "5": 0.1267438320528277, "1": 0.1141352306311773}, "score": 3.0173023655398308}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2872247122704061, "2": 0.2379750839682485, "4": 0.2315123868444078, "5": 0.12896866643205349, "1": 0.11430981972692221}, "score": 3.0228552095428505}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28838822589832425, "4": 0.2506884615016834, "2": 0.22376830838283224, "5": 0.14183483955981976, "1": 0.09531171007046836}, "score": 3.1199674263725816}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3041077194632467, "4": 0.24340289609477753, "2": 0.23319860651891586, "5": 0.12438467469949402, "1": 0.09489327879048072}, "score": 3.069187968690363}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28852726252834326, "4": 0.25688933241464024, "2": 0.21832707424632536, "5": 0.1476900290275741, "1": 0.08855821027200501}, "score": 3.1568271646481985}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3199018336805854, "2": 0.3009829079695083, "4": 0.17766647895916127, "1": 0.13357181576200314, "5": 0.06786892550875089}, "score": 2.7452757429790062}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3054054319530553, "2": 0.28830120346409394, "4": 0.19006035488016715, "1": 0.1355396312333227, "5": 0.0806850157004006}, "score": 2.7920481812972144}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3205734999167024, "2": 0.3127516668478245, "4": 0.16999052139267568, "1": 0.13698256829118816, "5": 0.05969254146338954}, "score": 2.70265606470413}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31204901629578113, "2": 0.26618114652589886, "4": 0.21336588862702363, "1": 0.11285531261988985, "5": 0.09554204180909921}, "score": 2.912557623873821}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3179444172504028, "2": 0.28564080045044427, "4": 0.19764035278862158, "1": 0.1194918632364923, "5": 0.07927360148699968}, "score": 2.8315615188240795}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27030508863453684, "4": 0.2455589839786549, "2": 0.21975855776273182, "5": 0.15441079932849724, "1": 0.10995321740192485}, "score": 3.114717121874597}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2726888165652358, "4": 0.26135840876396527, "2": 0.20899482251075233, "5": 0.16289763200085844, "1": 0.09404425590567805}, "score": 3.1900733918307265}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2789168695950188, "4": 0.25552168503613987, "2": 0.21701858151635792, "5": 0.15377096867017498, "1": 0.09475939350871238}, "score": 3.1565282107073065}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.27264941587801034, "3": 0.2645367224713494, "2": 0.19550150526913304, "5": 0.18397395137666753, "1": 0.08332784599633983}, "score": 3.2784430614521853}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27777076271693263, "4": 0.2487651998215516, "2": 0.22481822324297956, "5": 0.14200082663849053, "1": 0.10663400733221619}, "score": 3.094681654819155}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31558898259959767, "2": 0.26962933406064155, "4": 0.21406178300433545, "1": 0.115652473815195, "5": 0.08505992252369989}, "score": 2.883246470242622}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3186908717847321, "4": 0.25633625507438434, "2": 0.22763561689027376, "5": 0.11363792290662508, "1": 0.08368913656948124}, "score": 3.088599114283588}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3257962803020981, "2": 0.24811666997336226, "4": 0.24457907676627344, "5": 0.09827417524764409, "1": 0.08322653930397432}, "score": 3.0265578714480816}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3364786766360989, "2": 0.26363705853157327, "4": 0.22836784381797343, "1": 0.0872296136187991, "5": 0.08427778262625904}, "score": 2.958826751722253}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31323135754552317, "4": 0.2717744186445649, "2": 0.2207298993094018, "5": 0.12154362829965096, "1": 0.07271280319323414}, "score": 3.148707343296191}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2790019522146852, "2": 0.26982855585032883, "4": 0.19676422390307863, "1": 0.1487859921189573, "5": 0.10560775213870335}, "score": 2.840577350941625}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2756045584183275, "2": 0.24501464370477682, "4": 0.21542647735876058, "1": 0.13462361922652027, "5": 0.1293112875039733}, "score": 2.9597863895103966}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27607284967371126, "2": 0.2673662333398101, "4": 0.20196919362867757, "1": 0.15015747533667917, "5": 0.10442091378339013}, "score": 2.843127745410353}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2831899514387173, "2": 0.2768240979389614, "4": 0.19232219777537746, "1": 0.15204423207117926, "5": 0.09560400179696399}, "score": 2.8026145760677763}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2749802505709781, "2": 0.2632973966288211, "4": 0.20258607925841873, "1": 0.14986675195142962, "5": 0.10925675677588759}, "score": 2.858066880528577}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2718119532834869, "3": 0.25261492128669644, "1": 0.21195845298539728, "4": 0.16834202601754206, "5": 0.09526421855003923}, "score": 2.6631387648383376}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.25391523198681587, "2": 0.24586425605609738, "4": 0.19146941421700814, "1": 0.18117970408637518, "5": 0.12755830816256572}, "score": 2.8383602511777912}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26536050002981987, "2": 0.24754707822784083, "4": 0.19760845620980466, "1": 0.16687849603910518, "5": 0.12259496804511898}, "score": 2.861492867468499}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.25072797311664957, "2": 0.2451862875538422, "4": 0.1935292722840325, "1": 0.1794929944408684, "5": 0.1310534137937903}, "score": 2.851462329323705}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2590105459908938, "2": 0.25857962639243853, "4": 0.18434298640899, "1": 0.18328209688858152, "5": 0.11477598578913077}, "score": 2.788749287571955}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3004470340329908, "2": 0.2534369258816879, "4": 0.2307481552993834, "5": 0.10896509253686162, "1": 0.10639119066543906}, "score": 2.982458829655185}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2990686001401708, "4": 0.24430974793998902, "2": 0.23859023413921449, "5": 0.1201103710702975, "1": 0.09790472177659473}, "score": 3.050131630783731}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30913966930012404, "4": 0.24816676978643587, "2": 0.2388759498696221, "5": 0.11210613752015068, "1": 0.09169945894589429}, "score": 3.0501047790530915}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30869831680981985, "4": 0.2635842573169676, "2": 0.22280043912341577, "5": 0.1298223502016513, "1": 0.07507868365370787}, "score": 3.1502735485874966}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30235374682390814, "4": 0.263287417846588, "2": 0.22020525286617387, "5": 0.13788743708010553, "1": 0.07625376405936729}, "score": 3.166351570674561}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28158078277877713, "2": 0.2377125282173651, "4": 0.21878648042312943, "5": 0.13467171537276829, "1": 0.12723883093712648}, "score": 2.995939681845154}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28721813489980624, "2": 0.247801142307875, "4": 0.2088036379485907, "1": 0.1366072989850855, "5": 0.1195591800084907}, "score": 2.926905482458026}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.292518870459423, "2": 0.252821998781262, "4": 0.2071146239675393, "1": 0.13377553440339987, "5": 0.11375818132513667}, "score": 2.9142569937715486}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29126828353113365, "2": 0.2413856299626617, "4": 0.21594664839032274, "1": 0.12943479993943308, "5": 0.12195575060493122}, "score": 2.959602560723527}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2818988670072944, "4": 0.23244384732647494, "2": 0.22916775248600413, "5": 0.13839041416650316, "1": 0.11809130293772681}, "score": 3.0438746602257023}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2880855195624045, "2": 0.28432816424540613, "4": 0.18010162573405838, "1": 0.15601874791674789, "5": 0.09145421632127843}, "score": 2.766641661886478}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.288957806441742, "2": 0.26633040951114695, "4": 0.2073890668211074, "1": 0.12779843280315548, "5": 0.10951464438412409}, "score": 2.9044901597533395}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2998025762864986, "2": 0.2637807271328348, "4": 0.20918498976727704, "1": 0.12556001845837408, "5": 0.10166356497000324}, "score": 2.8976105239085648}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3001666675774432, "2": 0.28738908054135676, "4": 0.1951758171947091, "1": 0.1277540688893073, "5": 0.08950419350450863}, "score": 2.831285269668139}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29779915387165967, "2": 0.2617088637841328, "4": 0.2123210421536719, "1": 0.12705331213706045, "5": 0.10110849811096308}, "score": 2.898721625651609}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2868588775523118, "2": 0.25065462084367646, "4": 0.21791794197781203, "1": 0.12807483979836648, "5": 0.11648386656346656}, "score": 2.9440808236779086}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29943078199705997, "2": 0.2559521413067607, "4": 0.22537991265578602, "1": 0.11468851392607626, "5": 0.10453785754755626}, "score": 2.9491259095299673}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30610992791171404, "2": 0.25504150050172236, "4": 0.22908041038721813, "1": 0.10884251043085377, "5": 0.10091431384391471}, "score": 2.958182042624589}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2917118730466655, "2": 0.2502669827381229, "4": 0.22281380755081198, "1": 0.12057284329753123, "5": 0.11462538381162395}, "score": 2.9606515473939723}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3094768461985071, "2": 0.2739821282736438, "4": 0.20864740690234929, "1": 0.12101545672678192, "5": 0.08686990711085411}, "score": 2.866373076334942}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2864876930343718, "2": 0.27249026235347246, "4": 0.19425032823118066, "1": 0.1514298193461731, "5": 0.09533125097390699}, "score": 2.8095609017069383}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27943577447539436, "2": 0.24975755791236132, "4": 0.21181936910917967, "1": 0.13710248049238033, "5": 0.12187426261754607}, "score": 2.931604653507379}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28910327550994447, "2": 0.25233404345402854, "4": 0.2129503157226542, "1": 0.13356294688788645, "5": 0.11204005922326493}, "score": 2.917569725457774}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2881770300545145, "2": 0.23700906254300538, "4": 0.22601893500759998, "5": 0.13101650124650097, "1": 0.11776632670837155}, "score": 3.015510409906096}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2860887218530491, "2": 0.2477105627691959, "4": 0.21454372826836415, "1": 0.12809915070999273, "5": 0.12354587924966688}, "score": 2.957726117103369}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2719592609018062, "2": 0.24533599494981403, "4": 0.21666400271449918, "1": 0.1368705213058319, "5": 0.12916198043735388}, "score": 2.9559105627444033}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28347852733658757, "2": 0.2550855499724213, "4": 0.21398488442135968, "1": 0.13070109244116673, "5": 0.11674146383614352}, "score": 2.9309794918074723}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2887029136655374, "4": 0.23506951501646686, "2": 0.23361998020177743, "5": 0.1431294519256512, "1": 0.09946864600545344}, "score": 3.0887719893840133}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27659810799373, "2": 0.24097077943504563, "4": 0.21440766489101734, "5": 0.13830557917760214, "1": 0.12971066017752966}, "score": 2.9906266558900056}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2788617052941421, "2": 0.2365892177774841, "4": 0.23023091395179837, "5": 0.14061954470286503, "1": 0.11368966266420763}, "score": 3.0475018856599676}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3299856864025635, "4": 0.3048343087464852, "2": 0.1996058513806793, "5": 0.12584733923202007, "1": 0.03971588283045815}, "score": 3.2774944035734155}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3387030209324259, "2": 0.2812990895701768, "4": 0.2224236460700725, "1": 0.08729927682171884, "5": 0.07026369803178631}, "score": 2.907052351532592}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3435539912170446, "4": 0.30107333681679516, "2": 0.19455336176580362, "5": 0.12595713856760554, "1": 0.03484944734526188}, "score": 3.288739031494125}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.32018260670235116, "4": 0.31597647954027, "2": 0.17251781025247143, "5": 0.15786195979700401, "1": 0.03345060854157964}, "score": 3.3922855045916847}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3184167562446868, "4": 0.29640785042400586, "2": 0.19494373510042717, "5": 0.14206837829415017, "1": 0.04815137907128353}, "score": 3.2893015567082116}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2922506659303643, "2": 0.27548775440437373, "4": 0.1984040640932873, "1": 0.14022579978787117, "5": 0.09362313099633293}, "score": 2.8297095101981227}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2925872108494091, "2": 0.2545010798436428, "4": 0.2176253005172172, "1": 0.1247257065984414, "5": 0.11055228527769845}, "score": 2.9347768290542944}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.310518561502247, "2": 0.2855327058656644, "4": 0.1989044142609906, "1": 0.12331095801140517, "5": 0.08172523915809042}, "score": 2.830198891699663}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3047167568249471, "2": 0.26061866335261025, "4": 0.21889813376578707, "1": 0.11223167694802273, "5": 0.10352704459240598}, "score": 2.9408697489493596}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30309787676719757, "2": 0.27149626407931576, "4": 0.20768908525718238, "1": 0.12391728405945002, "5": 0.0937931456250338}, "score": 2.8759437572699524}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2998487794233646, "2": 0.2560602527221532, "4": 0.21883954257815832, "1": 0.11530649753490323, "5": 0.10993058036502469}, "score": 2.9520267672262204}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28606331830248294, "2": 0.23473952120369504, "4": 0.22819530861088375, "5": 0.1321176850743561, "1": 0.11886584199888812}, "score": 3.0199598393183815}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.310745944301218, "4": 0.25937857628642197, "2": 0.22727375930330124, "5": 0.11999922434651775, "1": 0.08259397855188899}, "score": 3.1069162192003392}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3172505940155349, "2": 0.24026893992591744, "4": 0.2396441893671218, "5": 0.1131094890198122, "1": 0.0897167314998364}, "score": 3.046161228686401}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2975997845445824, "2": 0.23969574237658212, "4": 0.23200357452480874, "5": 0.12315886150508831, "1": 0.10753154850548503}, "score": 3.023562705285891}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2737876973821927, "2": 0.2590939089969819, "4": 0.19342084886292465, "1": 0.16459904379844442, "5": 0.10908400560074244}, "score": 2.8232943020580605}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2810854959148797, "2": 0.26969723527536216, "4": 0.19868105077023535, "1": 0.1479454580248285, "5": 0.10257758909274756}, "score": 2.8382459471807073}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2869005611754621, "2": 0.25070300185411665, "4": 0.21615455386774543, "1": 0.13170261693567265, "5": 0.1145273980880556}, "score": 2.931100296611276}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2756462329780776, "2": 0.23394280887819796, "4": 0.2272079503522031, "5": 0.13469226784464794, "1": 0.12850170580344378}, "score": 3.0056463165660467}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2894782251989898, "2": 0.252879724632739, "4": 0.2199690333581481, "1": 0.12359497377947533, "5": 0.11407034037880949}, "score": 2.9480396416915275}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3099839676805003, "2": 0.24530778293261687, "4": 0.2297747035302319, "5": 0.11319268901181694, "1": 0.10172491710375992}, "score": 3.0074025824089765}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30727105672869, "4": 0.259409340409846, "2": 0.21559140634390972, "5": 0.14420031062606634, "1": 0.07351416281245622}, "score": 3.185192771108191}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3186924333738298, "4": 0.2641110817837296, "2": 0.22386573593103876, "5": 0.1250970178403551, "1": 0.06822285861375989}, "score": 3.153995338613622}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30259527270712283, "4": 0.25880518028462035, "2": 0.2164432479679433, "5": 0.14572418322102657, "1": 0.07642360993400223}, "score": 3.1809646181550084}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30808803775045684, "2": 0.24149886637497725, "4": 0.23320511285080067, "5": 0.12353110404608339, "1": 0.09366631057632245}, "score": 3.051436377015622}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31728676264482536, "2": 0.2552132012023651, "4": 0.2316670656168072, "1": 0.09840941486289062, "5": 0.09741347800814056}, "score": 2.974461733338847}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30073127111448505, "4": 0.24344904965909672, "2": 0.2417172075431177, "5": 0.11121785983890219, "1": 0.10287873648630105}, "score": 3.0184101969876806}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3158478085257842, "2": 0.24887259005493995, "4": 0.23921383977219332, "5": 0.0991685352485069, "1": 0.0968903259952108}, "score": 2.994897633015456}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3186363484411748, "2": 0.256280687398038, "4": 0.23196260631114737, "5": 0.10207565754645387, "1": 0.09103766108536389}, "score": 2.9977578960526308}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.32441095087157307, "2": 0.26388662996998336, "4": 0.22683588421524736, "5": 0.09392616350522012, "1": 0.09093362811066458}, "score": 2.968934115546948}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "human", "scores": {"2": 0.26056388706676287, "3": 0.2374299135263444, "1": 0.2236522474932412, "4": 0.16100742452481148, "5": 0.11733091535903371}, "score": 2.687795999051465}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.24986140371203952, "3": 0.2477793863226821, "1": 0.19276073002398295, "4": 0.18168426611174712, "5": 0.12790109615851705}, "score": 2.8021009986947787}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.26546905467224313, "3": 0.24800333136102914, "1": 0.21849011625510859, "4": 0.16174308462381476, "5": 0.10627723230189914}, "score": 2.671842624043533}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2627170451307094, "2": 0.2621119176048294, "4": 0.18287893544684763, "1": 0.1764175765618357, "5": 0.11586244621434429}, "score": 2.7996543371634726}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.25458131122781136, "3": 0.2466691534373695, "1": 0.20321513150141465, "4": 0.17419016051489897, "5": 0.12132678151187277}, "score": 2.7558278856217573}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27472573671705036, "2": 0.2562210578202509, "4": 0.18533925916480512, "1": 0.174817588519797, "5": 0.10888198388124005}, "score": 2.797244077674726}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27297979432441233, "2": 0.2713611740086362, "1": 0.18519241746904247, "4": 0.17248337913388495, "5": 0.09796496149578586}, "score": 2.726662298323592}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28192849613520027, "2": 0.26179170774888627, "4": 0.18586096217237866, "1": 0.1609394776321201, "5": 0.10946226510837247}, "score": 2.82111177196097}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2866750599316422, "2": 0.2547072328177607, "4": 0.20319546122874185, "1": 0.14445065754799263, "5": 0.11095820279272296}, "score": 2.8815017327204195}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2783374367760786, "2": 0.25899749218833445, "4": 0.19517035234833588, "1": 0.15419792106693267, "5": 0.11328496732778595}, "score": 2.8543452295431653}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28003908395513244, "4": 0.23680726418165476, "2": 0.23167044798065636, "5": 0.13736260469898665, "1": 0.11411197224128505}, "score": 3.05163852659899}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28387479520027603, "2": 0.2379879111709644, "4": 0.23632105403659423, "5": 0.12736631172140248, "1": 0.11443923449053835}, "score": 3.024187555974091}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30039019483130974, "4": 0.24251012909815295, "2": 0.23691453848203428, "5": 0.1237003339389538, "1": 0.09647508408363854}, "score": 3.0600466739543544}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28746720350987837, "4": 0.23688750807530756, "2": 0.2344051618446981, "5": 0.13039547904381418, "1": 0.11083335633727485}, "score": 3.0416070614368844}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2730341773158078, "2": 0.237641890551256, "4": 0.22400011807650091, "5": 0.13584531911210854, "1": 0.1294698556295829}, "score": 2.9991091467939346}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2751593760270684, "4": 0.24340228758829796, "2": 0.22558999697298934, "5": 0.13871606955625382, "1": 0.11712521532555634}, "score": 3.0609944293637255}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2940550747810888, "2": 0.2491646390526135, "4": 0.24090840017559342, "5": 0.11581267081621614, "1": 0.10005046202720388}, "score": 3.0232683823725823}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26924447045489386, "2": 0.2495515180338669, "4": 0.22348202348450363, "1": 0.1315914805037438, "5": 0.12612425590358736}, "score": 2.962995824914305}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28823965772739557, "4": 0.24780225741552442, "2": 0.23441228786993326, "5": 0.13370326163446924, "1": 0.09583778081359454}, "score": 3.0891213549183054}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27127801455364003, "4": 0.267592841990566, "2": 0.21305937420089222, "5": 0.16114653059398626, "1": 0.0869187591036403}, "score": 3.202989920075339}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2896422031438929, "2": 0.25587516248085146, "4": 0.21856918028098948, "1": 0.13048971077027707, "5": 0.1054125057008533}, "score": 2.912538624803317}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.32113579754468957, "2": 0.2591619819078609, "4": 0.21398009121363276, "5": 0.10350658966940744, "1": 0.10220241207238466}, "score": 2.9574259056044756}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30696820608470066, "2": 0.25042214629424286, "4": 0.22360863955689197, "5": 0.11407442417009449, "1": 0.10491864905704244}, "score": 2.991497976026579}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29204998787870406, "4": 0.2396461544575315, "2": 0.23294917086704375, "5": 0.1270778993316933, "1": 0.10826842702798202}, "score": 3.0443162987015358}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29644573376798417, "2": 0.24885173540571534, "4": 0.22452655358930082, "1": 0.11737000479692429, "5": 0.11279658671441394}, "score": 2.966527667856438}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2636061093576538, "4": 0.26284349499422355, "2": 0.20165751314765581, "5": 0.16800467039416872, "1": 0.10386976751244503}, "score": 3.1894592821095253}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.30737877411044184, "3": 0.26476135656260474, "5": 0.20560568397303922, "2": 0.16463410712888563, "1": 0.057606561663461425}, "score": 3.4387488419764467}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.298233274013744, "3": 0.26497756949326845, "5": 0.18666699966556005, "2": 0.17699655674776243, "1": 0.07311154429521885}, "score": 3.3483525243746572}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.30713597934398573, "5": 0.2453746138746488, "3": 0.24129413801373753, "2": 0.14889763835933337, "1": 0.05728167009891475}, "score": 3.534432758248285}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2912882069631008, "3": 0.2662655925780127, "2": 0.18719157898592578, "5": 0.18217992160167282, "1": 0.07306155309785947}, "score": 3.322337602684232}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2949410420718573, "2": 0.2519864406154284, "4": 0.21288829232982992, "1": 0.12868712605965027, "5": 0.11147823599550459}, "score": 2.926482684834308}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3000758508850928, "2": 0.2702652486007547, "4": 0.19256939436644227, "1": 0.14081155103814358, "5": 0.096263158834045}, "score": 2.8332048934111373}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31039565153538157, "4": 0.23490615148137178, "2": 0.23313679376197063, "5": 0.12378753628641898, "1": 0.09775958780158235}, "score": 3.0538260232780345}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29449648837068754, "2": 0.23410398078384764, "4": 0.23025308625639127, "5": 0.12967940367498673, "1": 0.11145147328403414}, "score": 3.0326054738444035}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30367506935810323, "2": 0.25452347692412614, "4": 0.21416680606369876, "1": 0.11953692016162917, "5": 0.10808060366417317}, "score": 2.9367296127134135}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30330132369131807, "2": 0.30233330840144934, "1": 0.16461861578828377, "4": 0.15579862048209464, "5": 0.07393609056087756}, "score": 2.6720963133126285}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.30649994593520424, "3": 0.30176768880305166, "1": 0.1705148481715822, "4": 0.1503132994665227, "5": 0.07088607274006514}, "score": 2.6445493530576796}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2895214764766245, "2": 0.27099795615346745, "4": 0.18187904513711303, "1": 0.15575613999076743, "5": 0.1018306744018109}, "score": 2.803027260762157}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28281474697909564, "2": 0.24575496910414446, "4": 0.2025859779654044, "1": 0.1403020472548198, "5": 0.1285273187456553}, "score": 2.933280555057701}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.29894517009974597, "3": 0.2885700831513141, "1": 0.16612610671991884, "4": 0.16225582867600769, "5": 0.08409022074808785}, "score": 2.699235099820566}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2943973480942553, "2": 0.25344242552265045, "4": 0.21466304774902314, "1": 0.12659576774058712, "5": 0.11089155912624715}, "score": 2.9298115135170617}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31019451826839056, "2": 0.2612209442683207, "4": 0.21488677875592666, "1": 0.10772241414414457, "5": 0.10596316979612463}, "score": 2.9501467388397224}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30060727510801133, "2": 0.276887525605161, "4": 0.20044365383213705, "1": 0.12480608078437784, "5": 0.09724209355444353}, "score": 2.8684263944811828}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31608658492498615, "2": 0.28328466599386937, "4": 0.19814480048256877, "1": 0.1118281456438329, "5": 0.09064448337034059}, "score": 2.872491366596977}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29795652272997386, "2": 0.29207875621932766, "4": 0.1805333777539593, "1": 0.1435951208949374, "5": 0.08582390484895133}, "score": 2.772909392242097}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2705276683431046, "2": 0.2464338447045177, "4": 0.2029713181143148, "1": 0.15532488863704427, "5": 0.12473090776885017}, "score": 2.895348321529294}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.281961596483599, "2": 0.24217942546639146, "4": 0.2200997117681723, "1": 0.13101930502962802, "5": 0.12472772717125485}, "score": 2.965336706511496}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.287634385537105, "2": 0.24310802186351105, "4": 0.21893633482307448, "1": 0.12940930379529766, "5": 0.1208975241579431}, "score": 2.958804159236161}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30413791885916464, "2": 0.23609110743515793, "4": 0.2329994467226866, "5": 0.12300404967066005, "1": 0.1037532079862454}, "score": 3.035410527940728}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29345147076856926, "2": 0.24929426328724494, "4": 0.21687873641563069, "1": 0.12115222090818627, "5": 0.11921206655333005}, "score": 2.9637037563738695}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3355305394622385, "4": 0.30054111872753686, "2": 0.2034063248961226, "5": 0.12061266302426317, "1": 0.03989722924415271}, "score": 3.258568796446677}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3868588427132076, "3": 0.26036111701916337, "5": 0.22911232351108257, "2": 0.10738298885519637, "1": 0.01627312345238772}, "score": 3.705162436996911}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3396491859770457, "4": 0.30338541047213463, "2": 0.19436265681137888, "5": 0.12677003271065768, "1": 0.035821639961302}, "score": 3.2909227608577516}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.33279589661297315, "3": 0.31181753062417006, "2": 0.16574883145272354, "5": 0.15651264085928984, "1": 0.03311336505496297}, "score": 3.413850473468045}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.33559473259431494, "4": 0.30424234733083055, "2": 0.19613599663083972, "5": 0.12685877742770343, "1": 0.03715756108479625}, "score": 3.287511826678801}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2950543801910799, "2": 0.2599726879059391, "4": 0.20399536622076384, "1": 0.13473012169012846, "5": 0.10623770452410534}, "score": 2.8870367437807616}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2939150496985911, "2": 0.26780978712401005, "4": 0.1934783420822759, "1": 0.14548101237896247, "5": 0.0993058100075134}, "score": 2.833316483595451}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29698326160498384, "2": 0.26258616583840466, "4": 0.20253734291096687, "1": 0.1350569820957926, "5": 0.10282808118347378}, "score": 2.8754923584729073}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29829686412622886, "2": 0.24842618992499035, "4": 0.22142058201448667, "1": 0.1219046618492695, "5": 0.10994445447970498}, "score": 2.9490736082559796}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29155975580930876, "2": 0.25317867859967164, "4": 0.21286300270293476, "1": 0.13407827604374378, "5": 0.1083132810990939}, "score": 2.908153690762119}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2953468649439925, "4": 0.2748711600525417, "2": 0.19742606878257535, "5": 0.15854192652210872, "1": 0.07380354598151427}, "score": 3.24692442869083}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3037404272652877, "4": 0.25359831519347176, "2": 0.20942673801319542, "5": 0.15182002586914561, "1": 0.08140240996192896}, "score": 3.1850090445879413}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3051802479645111, "4": 0.23215605095629457, "2": 0.2318202018043908, "5": 0.13034304452743084, "1": 0.10048566484651068}, "score": 3.0600514966694266}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3031565015653996, "4": 0.28066553092545415, "2": 0.20343921835822304, "5": 0.14341063362134385, "1": 0.06931975142826526}, "score": 3.2254099623051498}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2929930178829578, "4": 0.26698136954538265, "2": 0.2056907195032463, "5": 0.15466911280492066, "1": 0.07965526046887292}, "score": 3.2113205777633085}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31313145267813974, "2": 0.29708389658061785, "4": 0.17392458382796316, "1": 0.147285308369863, "5": 0.06856002774573113}, "score": 2.7193859923309063}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31133916448113735, "2": 0.25558871716500425, "4": 0.22936533438090642, "1": 0.10196017327853894, "5": 0.10173812185496982}, "score": 2.973332287990839}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31621917944183026, "2": 0.27596437436058463, "4": 0.20695404814454388, "1": 0.1138155640438153, "5": 0.08703884201661989}, "score": 2.877435250192994}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30661591679925737, "4": 0.26519104187309855, "2": 0.22508015404864432, "5": 0.12345589650673944, "1": 0.07964878475943794}, "score": 3.127726159441559}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3146533884869883, "2": 0.2548262343568557, "4": 0.23185602079251516, "1": 0.10195425975998251, "5": 0.0967000944298094}, "score": 2.966521120913744}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "human", "scores": {"1": 0.32498833162149804, "2": 0.30587532337712475, "3": 0.21273859935819525, "4": 0.09946733302799182, "5": 0.05691809353981473}, "score": 2.257442385864281}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.3111368908940627, "1": 0.2862803223834505, "3": 0.22938689573570603, "4": 0.10704248149450515, "5": 0.0661377956850139}, "score": 2.3556104758297374}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.30914455374548594, "1": 0.29896869801044396, "3": 0.22056344346840046, "4": 0.1082503585353687, "5": 0.06306472493900642}, "score": 2.327292328114554}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.29698127182379686, "1": 0.2496063006042425, "3": 0.24084338777220454, "4": 0.1322941402798111, "5": 0.08026417476371903}, "score": 2.4966232181816927}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.30656903880949243, "1": 0.259750402353789, "3": 0.23599487270943845, "4": 0.12634763034666274, "5": 0.07132863637546841}, "score": 2.442929812310735}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2774538682931937, "2": 0.2457472279445416, "4": 0.21486316399659616, "1": 0.13281388389531792, "5": 0.12911122975220485}, "score": 2.961710220894112}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28496320850830925, "2": 0.2409739602703276, "4": 0.2286972277047459, "5": 0.13069330288818828, "1": 0.1146615194272752}, "score": 3.0197870476843853}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2886504611115832, "2": 0.2522412520582299, "4": 0.21964730020187279, "1": 0.1197661964074589, "5": 0.11968581237113156}, "score": 2.967244986001395}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2914453993495909, "2": 0.2486885422005128, "4": 0.2220373651025196, "1": 0.12001801769653131, "5": 0.11780020117484762}, "score": 2.968912864237182}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29478102099397185, "2": 0.256327180931568, "4": 0.22853285349763494, "1": 0.11204537004793769, "5": 0.10830416150476567}, "score": 2.96472292341575}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2626183346140172, "2": 0.25379475240978, "4": 0.2057814696931021, "1": 0.15680310013376844, "5": 0.12098976787228724}, "score": 2.8803585482359577}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.25515560608270743, "2": 0.24138946802469066, "4": 0.2073336391317868, "1": 0.15861446018648437, "5": 0.13749472860893103}, "score": 2.923703784923019}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26257876101293653, "2": 0.2406806807956279, "4": 0.21098593637048815, "1": 0.14650208771679019, "5": 0.13923870730725693}, "score": 2.955777883305568}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2590057284395417, "4": 0.22771669236808043, "2": 0.22404478815350398, "5": 0.15718693706354042, "1": 0.13203084624781236}, "score": 3.0539848960366434}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2588191820236174, "2": 0.2584886482304575, "4": 0.19569516716600152, "1": 0.17092291732271966, "5": 0.1160599512803057}, "score": 2.8274781484308513}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.281357183830199, "2": 0.2564201163781877, "4": 0.20457091315781253, "1": 0.143644540478189, "5": 0.11399037089367933}, "score": 2.8888405817663063}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3067588944651735, "2": 0.24327614054255148, "4": 0.23750561824946828, "5": 0.11515138787854706, "1": 0.09729640870286245}, "score": 3.029939781867599}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30542565046187586, "2": 0.25464763829811204, "4": 0.2201829472038594, "1": 0.11192303851534564, "5": 0.10780586669031318}, "score": 2.9573003307885353}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30451388302937443, "4": 0.25237431918128134, "2": 0.22774909875906446, "5": 0.12992279364376966, "1": 0.08543018383006161}, "score": 3.1136115445306762}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29743082560737066, "2": 0.23945686086602702, "4": 0.23280157446079022, "5": 0.1261485750044116, "1": 0.10415087603799178}, "score": 3.0373405330284142}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3086890559992284, "1": 0.2666914518136996, "3": 0.23634178030186664, "4": 0.12084240745449049, "5": 0.06742385445603791}, "score": 2.413611442605806}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.29867621061551386, "3": 0.25554682960704006, "1": 0.21736928448377546, "4": 0.1470146260814784, "5": 0.08138422669469002}, "score": 2.57636456235673}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.31075371304693444, "1": 0.26960773761593243, "3": 0.23359991310737216, "4": 0.11897323822826542, "5": 0.06705693126674461}, "score": 2.4031128587978543}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2895906803790394, "3": 0.2552009767828047, "1": 0.2058030367212185, "4": 0.1580763238895903, "5": 0.09132087277868262}, "score": 2.6395183923183874}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.30856400053168626, "3": 0.2502829502809808, "1": 0.2355032653539319, "4": 0.1337911067818993, "5": 0.07184840972254217}, "score": 2.497912239887234}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31352135600538783, "2": 0.28706807391685774, "4": 0.18541650612738597, "1": 0.13529030526421798, "5": 0.07869214011659106}, "score": 2.7851496056610228}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31239623904422686, "2": 0.2772617425490608, "4": 0.19963559486836982, "1": 0.12510044554560326, "5": 0.08559794526808928}, "score": 2.8433675935792886}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30843739184774704, "2": 0.270719432182797, "4": 0.20288829953068335, "1": 0.12369851555741004, "5": 0.0942462444624657}, "score": 2.8732630430338513}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3109747996967472, "2": 0.2821721311809891, "4": 0.19422668940468668, "1": 0.1307864419693674, "5": 0.0818283105914976}, "score": 2.814136134399665}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3111790839170902, "2": 0.27973993807423697, "4": 0.19720830955471016, "1": 0.12640869627398615, "5": 0.08545234729422414}, "score": 2.8355537618522186}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "human", "scores": {"2": 0.25847613768264077, "3": 0.23718878351805736, "1": 0.21247923777060276, "4": 0.16559929405383464, "5": 0.12623841214869458}, "score": 2.7346366928099295}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.23985984629261914, "3": 0.22664988703659808, "1": 0.20660888859767992, "4": 0.17771573493369142, "5": 0.14914698243091457}, "score": 2.822928772032973}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.24446268482921138, "3": 0.23681304234939415, "4": 0.18729310178039435, "1": 0.1843320736272161, "5": 0.14708404807222297}, "score": 2.8683323843302757}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.23737580941444947, "2": 0.22493115530956057, "4": 0.21626343671547313, "5": 0.1717942395449907, "1": 0.14962169558392496}, "score": 3.035677856810001}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2464242339719847, "2": 0.24054783766648083, "4": 0.19575433475776668, "1": 0.1716483623086261, "5": 0.14561024233300182}, "score": 2.903128805141365}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29298648421150975, "2": 0.26906674701290406, "4": 0.2021029212902277, "1": 0.1319324803187206, "5": 0.10389607066741807}, "score": 2.876961472915985}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3111383221270526, "2": 0.299820954747719, "4": 0.18222350425119702, "1": 0.13389067101455918, "5": 0.07291473749310055}, "score": 2.760447853261943}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2875370090209367, "3": 0.2870559024885598, "4": 0.18318111795228784, "1": 0.14884737900088033, "5": 0.09336829923297627}, "score": 2.7846837332949925}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.293080372121091, "2": 0.27208115315453596, "4": 0.19928028059205966, "1": 0.13687963718610632, "5": 0.09866539518970961}, "score": 2.850768679298425}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28760059048230274, "2": 0.270356181124377, "4": 0.20162337542052006, "1": 0.1369468752848922, "5": 0.10346308464450742}, "score": 2.8642982705122746}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30373395766308847, "2": 0.29346681868183483, "4": 0.1806483418914399, "1": 0.14394879973895686, "5": 0.07819018115437627}, "score": 2.755661378198196}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29683068111575966, "2": 0.2902473176391952, "4": 0.18463534632975256, "1": 0.1440846074803969, "5": 0.0841922167209482}, "score": 2.774601031338875}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30331336499288686, "2": 0.28605668171048304, "4": 0.1886407436567677, "1": 0.13610341197786174, "5": 0.08587175642851046}, "score": 2.802117972339828}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3075166029068919, "2": 0.25740573591920535, "4": 0.21765180889314753, "5": 0.10874658628378134, "1": 0.10866676297618726}, "score": 2.9604052245348296}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29503626440829633, "2": 0.2905003784317412, "4": 0.18534841515035883, "1": 0.14760052646294577, "5": 0.08150328115297568}, "score": 2.762650903360396}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2840327018757687, "2": 0.2384425209513218, "4": 0.23396447298533277, "5": 0.12597094422652885, "1": 0.117570902717975}, "score": 3.0123222624861126}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2982663499178571, "2": 0.2590656433934271, "4": 0.21747588677537408, "1": 0.1185216067008135, "5": 0.10666075449520913}, "score": 2.9346879016084326}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30082673836978874, "2": 0.24771353531378432, "4": 0.22691749175903642, "5": 0.11763120853797951, "1": 0.10690177038033614}, "score": 3.0006628388955363}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30842153857323873, "4": 0.24506120090987513, "2": 0.2356051896665853, "5": 0.1223428046971676, "1": 0.08855829883025958}, "score": 3.0770258677446676}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2914504122535706, "2": 0.25285069570664337, "4": 0.21811147362121688, "1": 0.12195036027988154, "5": 0.11562401524335997}, "score": 2.9526074697057187}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2640398342255922, "2": 0.2495753263843276, "4": 0.1993666673843339, "1": 0.16956729674730764, "5": 0.11743746498113541}, "score": 2.845529605976843}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2657611515717093, "4": 0.22949537550260593, "2": 0.22767944096445697, "5": 0.14275588576750456, "1": 0.13429516199047464}, "score": 3.018737625385345}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26411187411816356, "2": 0.23043674024599756, "4": 0.22450482047081333, "5": 0.14088598961152762, "1": 0.14004981475262904}, "score": 2.9957403841057344}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2627536967148938, "4": 0.23361998020177743, "2": 0.22027967279365598, "5": 0.15436803346042943, "1": 0.12896724778452534}, "score": 3.064142608000108}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27248227850574946, "2": 0.23653043266121956, "4": 0.22213917036266548, "1": 0.13939373838404134, "5": 0.12944145305913365}, "score": 2.9657037237027346}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2989670835838336, "4": 0.2548917840936671, "2": 0.22192783888891685, "5": 0.13425477208069483, "1": 0.08994907519152842}, "score": 3.1215764874142007}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31118446736180866, "4": 0.26434981397714963, "2": 0.21207342922744152, "5": 0.14237853908994164, "1": 0.07000658989546586}, "score": 3.197021693902291}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2927807920409081, "4": 0.281409915107215, "2": 0.19017845705135522, "5": 0.16802054758570648, "1": 0.06759959412630404}, "score": 3.2920764884664844}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3035978242464534, "4": 0.2731792789170428, "2": 0.20261503087768867, "5": 0.1507638309481967, "1": 0.0698328883768667}, "score": 3.232428723979873}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29938515222296075, "4": 0.2647002831627333, "2": 0.21058150576894455, "5": 0.14388979282830713, "1": 0.08143501001297238}, "score": 3.1790298210953916}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28181053374491954, "2": 0.26694367443734013, "4": 0.20162807329989746, "1": 0.14079666804377897, "5": 0.10881085274940246}, "score": 2.8707114498247677}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2857658242179266, "2": 0.2401662228896726, "4": 0.22706496795588724, "5": 0.1351029092768835, "1": 0.11188915334975617}, "score": 3.03332662092415}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2808375473881143, "2": 0.24236369720706055, "4": 0.220410910445465, "5": 0.13251611742634153, "1": 0.12386092690633767}, "score": 2.9953575441369793}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2788879474152828, "4": 0.25270747108182384, "2": 0.2122428374879264, "5": 0.16270399673507668, "1": 0.09344766799187648}, "score": 3.1789790950621453}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28200775737510925, "4": 0.25251927412793773, "2": 0.22074287860906888, "5": 0.15125970784979853, "1": 0.09346075158122524}, "score": 3.1473757273515997}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27040160477828595, "2": 0.25883279627064343, "4": 0.19756759500625456, "1": 0.14895700078812948, "5": 0.12422865742340118}, "score": 2.889276745046381}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27126691950973997, "2": 0.2655952886642768, "4": 0.1899612452491005, "1": 0.15322152943334957, "5": 0.11994035517186417}, "score": 2.8578015231518146}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2733113110410078, "2": 0.2619465771552186, "4": 0.19248200695241327, "1": 0.15101977356181737, "5": 0.12122517650260366}, "score": 2.8709442798668254}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27100825427146424, "2": 0.2631370447029507, "4": 0.19343941815572727, "1": 0.153396639050333, "5": 0.11900422289352841}, "score": 2.8615155440650772}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.261493539847075, "2": 0.24066722712160513, "4": 0.19943909050917122, "1": 0.15302467440063805, "5": 0.14535526932040466}, "score": 2.943431910619513}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2843614894590751, "2": 0.27312686084309373, "4": 0.19420270388968128, "1": 0.15087554308526255, "5": 0.09742223587347362}, "score": 2.814167153455596}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28585837017419014, "2": 0.2665428394205804, "4": 0.20155928953646488, "1": 0.14145078946783174, "5": 0.10457855160026273}, "score": 2.861270564917339}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2962351246338158, "2": 0.2686156853262268, "4": 0.20976387198860127, "1": 0.12657566592879602, "5": 0.09880103485917718}, "score": 2.885597938690443}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29908026404302085, "2": 0.24910477198316555, "4": 0.22844186983142234, "5": 0.11322896175996028, "1": 0.11013278553187276}, "score": 2.985529286107404}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2897437405294821, "2": 0.2699045232807149, "4": 0.20219156285445608, "1": 0.14093885995268565, "5": 0.09721278920383374}, "score": 2.8448335754096865}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2882583939140673, "2": 0.2598352766737032, "4": 0.21063946577426312, "1": 0.13746235241279037, "5": 0.10378619637429072}, "score": 2.883449742422972}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29075549161672437, "2": 0.25333070738731017, "4": 0.21945574151207717, "1": 0.1283430656505285, "5": 0.1081016814369037}, "score": 2.9256412758047015}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3015264314972042, "2": 0.2568376001127096, "4": 0.215622367492818, "1": 0.12421773820432036, "5": 0.10177667773329054}, "score": 2.9139009946321037}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2961280549902648, "4": 0.25164439978276015, "2": 0.2286245364109519, "5": 0.12581541581171402, "1": 0.09776933491837189}, "score": 3.0791134696190197}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2963681344330798, "2": 0.2611551509994697, "4": 0.21995704537250566, "1": 0.12450195006840513, "5": 0.09800362609761633}, "score": 2.9058039189233633}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.32634476339757584, "2": 0.2596116807446923, "4": 0.225473239256899, "5": 0.09563155884106118, "1": 0.09292790514099164}, "score": 2.971268554100916}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31055933526611124, "4": 0.2594320656634175, "2": 0.2278336777005425, "5": 0.12676212250741745, "1": 0.07540405692834273}, "score": 3.1343156932999725}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31710174324232926, "4": 0.2604058248610139, "2": 0.22107437403152, "5": 0.1275272770012836, "1": 0.07388204825173549}, "score": 3.1466231887320246}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3215924558919144, "4": 0.2790613580538389, "2": 0.2128708149184872, "5": 0.12728759820035246, "1": 0.05917661689505973}, "score": 3.2024147638932097}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3119131485365363, "4": 0.26291184318780214, "2": 0.22408359607148087, "5": 0.1286354685494764, "1": 0.07244714626631339}, "score": 3.151206221902509}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28032088896175544, "2": 0.2711051570427046, "4": 0.1915250058566914, "1": 0.16023587990193078, "5": 0.09679965003955446}, "score": 2.7935446188301825}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2856120949924724, "2": 0.25696571696716825, "4": 0.20443142291650265, "1": 0.15136577807827276, "5": 0.10159077959232671}, "score": 2.847910506383198}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2901044350405724, "2": 0.260190818459547, "4": 0.20346717282725346, "1": 0.14260136483140826, "5": 0.10361724556785505}, "score": 2.8653055615931446}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2917955188307182, "2": 0.24958356250599353, "4": 0.2088222431815827, "1": 0.1416664398196742, "5": 0.1081146976629098}, "score": 2.892133304596051}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30607855325208183, "2": 0.2741400148526046, "4": 0.19698956917425453, "1": 0.1301145191197288, "5": 0.09266200138436406}, "score": 2.8479421859469456}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2901434276968896, "2": 0.24583794998809913, "4": 0.23861266267534825, "5": 0.11971109268421141, "1": 0.10568940792214393}, "score": 3.0208181958586087}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2954117893198347, "4": 0.2581541737142595, "2": 0.2299576770080249, "5": 0.13408349179012746, "1": 0.08238647449648671}, "score": 3.1315913726454943}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3008014699850527, "4": 0.24437826199853352, "2": 0.24326587450603548, "5": 0.11654515319424977, "1": 0.09500515744124234}, "score": 3.0441925594312043}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2988482677843137, "4": 0.25799700568499, "2": 0.22841710807484406, "5": 0.12988352391916907, "1": 0.08484809830387753}, "score": 3.1196514662987767}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29352557662040835, "4": 0.24999964028023144, "2": 0.2321912020432795, "5": 0.12827366365777917, "1": 0.09600438610156715}, "score": 3.082347448837551}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2997392646683291, "2": 0.25624660433318813, "4": 0.218269050621672, "1": 0.11846096286258598, "5": 0.10727438296719002}, "score": 2.9396486990051134}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2940892459660857, "2": 0.29365654759104176, "4": 0.1768773720130623, "1": 0.15764058747104154, "5": 0.07772846840296042}, "score": 2.7233944346940318}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29096511462811137, "2": 0.2841452295136091, "4": 0.1827740844462671, "1": 0.15679155985028626, "5": 0.08531586936452758}, "score": 2.755675484622756}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2973825267632643, "2": 0.2571933351646772, "4": 0.21244662471072134, "1": 0.12626959688765205, "5": 0.10669961808664513}, "score": 2.9161126358142146}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30578556214281905, "2": 0.26382393795480885, "4": 0.20954912085809105, "1": 0.12098223044454208, "5": 0.0998511402056733}, "score": 2.9034622293130345}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "human", "scores": {"3": 0.32638908402574773, "2": 0.27720152783813345, "4": 0.21150898481570096, "1": 0.1064623901855782, "5": 0.0784241157556906}, "score": 2.8782292158230347}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3087194324968379, "4": 0.29274328922355436, "2": 0.19821796904899316, "5": 0.1428503071714502, "1": 0.057459156805451654}, "score": 3.2653102329531145}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.30719839571627705, "3": 0.30506250162743853, "2": 0.18522290264981942, "5": 0.15440366571435604, "1": 0.04810181830433471}, "score": 3.334582773271408}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.32150631281236164, "3": 0.29759154114472214, "2": 0.178935316282228, "5": 0.16084540382470627, "1": 0.041115545211509626}, "score": 3.3820329603871064}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3132012887785227, "4": 0.27108157192000965, "2": 0.22190242960607326, "5": 0.12302884978684137, "1": 0.07077711252260702}, "score": 3.1536839611753273}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "human", "scores": {"3": 0.24408613590019781, "2": 0.23788814375751036, "4": 0.18932953703530211, "1": 0.1867440530351912, "5": 0.14192953172700334}, "score": 2.8618092277510594}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.24684637485596186, "2": 0.22995054843053114, "4": 0.20477050801896016, "1": 0.16522172818508812, "5": 0.15319791981483172}, "score": 2.9507717067841726}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.24673522028261577, "2": 0.2329119485636805, "4": 0.20278280476239002, "1": 0.16878853833240956, "5": 0.14876626440437868}, "score": 2.9298252400263456}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2555232437231726, "2": 0.245981905655735, "4": 0.197722153289962, "1": 0.1700564905121576, "5": 0.13070455606600928}, "score": 2.8730348995029096}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.25280480746985606, "2": 0.24317892249949682, "4": 0.1961390759901597, "1": 0.17405453662445483, "5": 0.13380779157319006}, "score": 2.8724647674694097}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30177278872008667, "4": 0.26868859751696106, "2": 0.2226415054443384, "5": 0.13137488830305472, "1": 0.07551235452661353}, "score": 3.157773716140358}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2999109745096245, "4": 0.29138364861219046, "2": 0.19447357234273677, "5": 0.15584630215488607, "1": 0.05837629961668743}, "score": 3.2918527671979527}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31258051343435506, "4": 0.2630495398747421, "2": 0.222049266624247, "5": 0.12385001523934319, "1": 0.07846137605929607}, "score": 3.1317787756730664}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.296052581568544, "4": 0.2806446782511928, "2": 0.20739910469485612, "5": 0.1439090753524464, "1": 0.07198415166204873}, "score": 3.2170976805920257}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30436263810463543, "4": 0.27950242785570645, "2": 0.21095576753871004, "5": 0.13559958011197426, "1": 0.06957299429090631}, "score": 3.200601154341614}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.26618250405320787, "3": 0.26377073003272267, "4": 0.18003287605850135, "1": 0.179054491084698, "5": 0.11093915290478316}, "score": 2.777615193272447}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2744954208381303, "2": 0.25860388229897835, "4": 0.19520968313677795, "1": 0.15356267332620507, "5": 0.11811464008482149}, "score": 2.865707894510874}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2824986802748513, "2": 0.25528446667633803, "4": 0.20095338766112264, "1": 0.14698474104591283, "5": 0.11426458485284643}, "score": 2.880226915068443}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2700678649231643, "2": 0.25581608772627756, "4": 0.1993609057709022, "1": 0.1602817620020559, "5": 0.11446215896501627}, "score": 2.851903950242146}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27192189626636754, "2": 0.2487711205037632, "4": 0.1896518606363042, "1": 0.16602290802435854, "5": 0.12360787776831436}, "score": 2.856047176269244}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2951568998893988, "3": 0.2838284989967369, "1": 0.1769370428135571, "4": 0.16437922055491988, "5": 0.07968335186593649}, "score": 2.674710064014512}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2896274896936979, "2": 0.26332733524479585, "4": 0.21225277068515586, "1": 0.12987354924756436, "5": 0.1049059441779376}, "score": 2.898988921152033}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.29012578751275264, "3": 0.287775792585532, "4": 0.17909007274699765, "1": 0.15807809435433248, "5": 0.08491754942648949}, "score": 2.742639926037313}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.29024409591185, "3": 0.28916217184555393, "4": 0.18529795164783108, "1": 0.14985064214151267, "5": 0.0854331568521892}, "score": 2.7662160840517185}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28249777628052086, "2": 0.2786825105893273, "4": 0.18680014069545833, "1": 0.15654782885593765, "5": 0.09546023553871333}, "score": 2.7859399800604012}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2400695754365642, "2": 0.22616159796101803, "4": 0.21517317714121814, "5": 0.1665351134840652, "1": 0.15203708616020215}, "score": 3.018008056113546}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.23345865124888998, "4": 0.21736678475137738, "2": 0.21472910973193038, "5": 0.18006252991511623, "1": 0.15435531405851885}, "score": 3.0540535991684155}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.24072241844422743, "2": 0.22721433498531166, "4": 0.2082889667901916, "5": 0.1635265526992996, "1": 0.1602208825254601}, "score": 2.987685641579081}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.23964222429282586, "2": 0.23142901109953956, "4": 0.20893595696085304, "5": 0.16169141596278558, "1": 0.15827877530768458}, "score": 2.984331872815255}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2454233991969874, "2": 0.2354018559376294, "4": 0.21177491288944714, "5": 0.15496561893340147, "1": 0.15241446889198623}, "score": 2.9814749912740868}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2712850678737112, "4": 0.24279553732767412, "2": 0.22738033021993367, "5": 0.14840803581769113, "1": 0.11011744510333384}, "score": 3.0919976382008776}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28890184073508796, "4": 0.2769094005837341, "2": 0.1991762635135837, "5": 0.16107219473537154, "1": 0.07392562195164916}, "score": 3.252029982054791}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3128032125697719, "3": 0.26300708710503695, "5": 0.22025167702641266, "2": 0.15857265492495476, "1": 0.04535175065358147}, "score": 3.5040372742290717}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2950275314641181, "3": 0.2796692567228505, "5": 0.18662102924503207, "2": 0.18053875772877762, "1": 0.05813150542773301}, "score": 3.371472249100532}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3020417880962622, "3": 0.2760443052168288, "5": 0.1905687799446273, "2": 0.17608197946091922, "1": 0.05524963195800703}, "score": 3.396603464832655}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3073816327463337, "3": 0.29058989538771496, "1": 0.16968978551153474, "4": 0.16416653648880689, "5": 0.06814927903403203}, "score": 2.6536959705263348}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30408682798055026, "2": 0.25338685169262654, "4": 0.23291588480887238, "5": 0.10785682778406898, "1": 0.10174506063148991}, "score": 2.9917524969291507}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3252927281633504, "2": 0.3025302822227732, "4": 0.188303774194797, "1": 0.1166476180913583, "5": 0.0672134098514429}, "score": 2.7869024783712035}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3103624099412213, "2": 0.2830807178279706, "4": 0.2054201058415481, "1": 0.1155244596014003, "5": 0.08560032492404478}, "score": 2.862489471026435}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30096171951862943, "2": 0.2628897858094787, "4": 0.21821200254834752, "1": 0.11534461263051111, "5": 0.10257982530856442}, "score": 2.929791795792331}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2995820926459766, "3": 0.2772806524447228, "1": 0.18434551192520354, "4": 0.16277156546081786, "5": 0.07600323300964477}, "score": 2.6464989250799404}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3090475903084863, "2": 0.25386333701724434, "4": 0.22958627366795387, "1": 0.10551035280789654, "5": 0.10198015943108053}, "score": 2.9686621648563882}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2885285031982396, "2": 0.26310936414187097, "4": 0.21157405498670956, "1": 0.1277088774945634, "5": 0.10906863674711446}, "score": 2.9111832711405095}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29221866623446024, "2": 0.25253364288342284, "4": 0.22769562954820685, "5": 0.11390315604517767, "1": 0.11363603653276179}, "score": 2.97569591292625}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28768144637205023, "2": 0.24771185086747133, "4": 0.22596661768011006, "1": 0.1208045655388291, "5": 0.11782081801397402}, "score": 2.9722868643375007}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27931379944534507, "2": 0.27315384711004465, "4": 0.1804056414403992, "1": 0.17419005600083404, "5": 0.09293060938237777}, "score": 2.744731357580709}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28403131011893934, "2": 0.24901418905110004, "4": 0.2107591429759306, "1": 0.14517085788592735, "5": 0.1110169485151451}, "score": 2.893436330472729}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2833062531078767, "2": 0.2550370373145166, "4": 0.2046803674101907, "1": 0.14388707333692197, "5": 0.11308418925700246}, "score": 2.888036993211514}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2864868049239, "2": 0.2567477997064664, "4": 0.20331042108919672, "1": 0.14002788466880917, "5": 0.11342160336139609}, "score": 2.893349473656429}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27733605865397715, "2": 0.26487729446146213, "4": 0.19532020309163006, "1": 0.1580279599345426, "5": 0.10443416563816167}, "score": 2.823254556811658}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2853568433455927, "2": 0.27849465831394926, "4": 0.18886277232409043, "1": 0.14702337371196966, "5": 0.10024514930010156}, "score": 2.81680851374248}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2777959021084988, "2": 0.25100548186229993, "4": 0.2099122274835851, "1": 0.13995443130989738, "5": 0.12131792498008975}, "score": 2.9216326332907476}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2996651183465283, "2": 0.2623880405823078, "4": 0.21879019982491146, "1": 0.1128691382424879, "5": 0.10627654150213428}, "score": 2.943216343327751}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2841446896381859, "2": 0.27905625127771366, "4": 0.19803153367172013, "1": 0.13488539324801552, "5": 0.10387334069390583}, "score": 2.8569499196652317}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30338877806888104, "2": 0.2762007009984079, "4": 0.1979316123739365, "1": 0.12988325116405522, "5": 0.09258306846487833}, "score": 2.8471286214901164}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26632202023537915, "2": 0.2447542336172444, "4": 0.20574315675049093, "1": 0.14961753615860401, "5": 0.1335508733432202}, "score": 2.9288547309605675}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2643049840503844, "3": 0.25756164228819434, "4": 0.18837035134579297, "1": 0.17331129645391813, "5": 0.11643672343669427}, "score": 2.8103133755016003}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.24578495303935802, "2": 0.24134524952468678, "4": 0.18995326704434348, "1": 0.18419717350232953, "5": 0.1387053056069029}, "score": 2.857622281139271}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2555132785109903, "2": 0.23242485743989577, "4": 0.21179401584812024, "1": 0.15108460516049596, "5": 0.14916585071758603}, "score": 2.97553122395355}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2572522649079078, "2": 0.23486746562409058, "4": 0.2132940390958743, "1": 0.1530230982546089, "5": 0.141548608205742}, "score": 2.9554769467251525}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "human", "scores": {"1": 0.2678822126819425, "2": 0.23440940461652449, "3": 0.21009518269988925, "4": 0.15130769503949443, "5": 0.13627312977906597}, "score": 2.653668912084838}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.2670806783820502, "2": 0.23445767448214713, "3": 0.2066486439721905, "4": 0.1533838156273349, "5": 0.13838901643037868}, "score": 2.661529220496317}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.2744148133708161, "2": 0.2303016287231704, "3": 0.2078975227029271, "4": 0.14683548038626487, "5": 0.14050559063549684}, "score": 2.6486996102580322}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.2804051660871946, "2": 0.2509870838347754, "3": 0.2065804198543726, "4": 0.14080738307791899, "5": 0.12118853567028777}, "score": 2.5713735746208917}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.28017412334613695, "2": 0.23307753792073288, "3": 0.20599487276347478, "4": 0.14389403763980627, "5": 0.13681448430171683}, "score": 2.624080326285842}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2867232540598197, "2": 0.2560922110358502, "4": 0.20602093276313954, "1": 0.13545113920038301, "5": 0.11569298240416503}, "score": 2.9104106628864894}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27850493495644396, "2": 0.2432236958603904, "4": 0.21490839745327178, "1": 0.1353557880852261, "5": 0.12799278293147145}, "score": 2.956958071450904}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2798818301705348, "2": 0.24247453122414922, "4": 0.20510365366421274, "1": 0.14284907866409113, "5": 0.1296637912146732}, "score": 2.9362568191409046}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2821690555215216, "2": 0.23040952727393216, "4": 0.2300608361578731, "5": 0.14311392322256464, "1": 0.11423386323668591}, "score": 3.057412163420642}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27859276140754813, "2": 0.24557605092111076, "4": 0.20784684346494228, "1": 0.13588045325427972, "5": 0.13208574288007205}, "score": 2.95468054933476}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26283952608741445, "2": 0.2512873434516398, "4": 0.19926864296349514, "1": 0.16441805151257052, "5": 0.12216855370709978}, "score": 2.863479862609895}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27442200313311194, "2": 0.2453132533571713, "4": 0.21417425919823355, "1": 0.13746110151107502, "5": 0.1286123805550813}, "score": 2.9511627335858894}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27244734851670516, "2": 0.2436084392166415, "4": 0.21410023195317526, "1": 0.13732423094829638, "5": 0.13250901475280083}, "score": 2.960860940202906}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27656602447408285, "2": 0.2362271350852429, "4": 0.22818143475788957, "5": 0.13565202660948028, "1": 0.12336778045780654}, "score": 3.016522884481271}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27653123465652946, "2": 0.23076686973363822, "4": 0.22660578525982283, "5": 0.13786421879073604, "1": 0.12822131303376338}, "score": 3.0151248870391334}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2662879864559979, "2": 0.24838530233926934, "4": 0.19955160588257115, "1": 0.15925458400235473, "5": 0.12651145772690212}, "score": 2.8856790148335265}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2734698502342767, "2": 0.2468809110795568, "4": 0.20864296275991256, "1": 0.13923957058991843, "5": 0.13175598047384818}, "score": 2.946794300824408}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26548514258441513, "2": 0.24119732610276182, "4": 0.2086907266004513, "1": 0.1429483075125844, "5": 0.14166796982548627}, "score": 2.9649323559532785}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2716222404141739, "2": 0.23144046711912314, "4": 0.22486856567878902, "5": 0.146793829068998, "1": 0.12526591264764184}, "score": 3.036484259216048}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.26827859629580336, "2": 0.24217450927395398, "4": 0.21189135756094826, "1": 0.13998780042376197, "5": 0.13765881640604902}, "score": 2.965058568572621}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3117328836559514, "2": 0.26594392518464527, "4": 0.2071690815603173, "1": 0.12343526874993029, "5": 0.09170883110950799}, "score": 2.877771057614937}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3342989922729178, "2": 0.2859896378821338, "4": 0.1951574910459007, "1": 0.1102996418258932, "5": 0.07424288728717487}, "score": 2.8370524946833138}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3382922540997075, "2": 0.28062534249898563, "4": 0.19543856391853764, "1": 0.10883895133895413, "5": 0.07679409728887716}, "score": 2.850721902481102}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3397621041324222, "2": 0.2631348606745434, "4": 0.20343340007977975, "1": 0.10889523562503063, "5": 0.08476030052406636}, "score": 2.892027146897922}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3345626909778769, "2": 0.2579187928505312, "4": 0.2102643984401369, "1": 0.10381777293777958, "5": 0.09342142222832764}, "score": 2.9315518827491993}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3056142173590994, "2": 0.2922555757827946, "4": 0.1928242165848684, "1": 0.1261411576862726, "5": 0.08315060478068649}, "score": 2.8145848969407345}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30417262297553865, "2": 0.2792208592789912, "4": 0.20096301355893004, "1": 0.12672935873364952, "5": 0.08890507957660965}, "score": 2.8460922006567917}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29278975127022006, "2": 0.25859017665641926, "4": 0.22329015718331094, "1": 0.12122187922264602, "5": 0.10409774140440442}, "score": 2.9304509889345973}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2940874520271568, "2": 0.2595104519301038, "4": 0.2204996436932875, "1": 0.11969189256483562, "5": 0.10620123937974238}, "score": 2.9340072703140376}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28814769512602817, "2": 0.26379051357934885, "4": 0.20793091372630063, "1": 0.13840621925425434, "5": 0.10171484683545319}, "score": 2.8707563872384068}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29782089400339745, "2": 0.2622551746908804, "4": 0.1996715724440473, "1": 0.1387428304670781, "5": 0.10149171595885417}, "score": 2.8629117268606623}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.307099125237755, "4": 0.25351355144575244, "2": 0.2221579641314434, "5": 0.13317070200325498, "1": 0.0840477154787152}, "score": 3.1296029784406962}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31306479408792326, "2": 0.2650538410127138, "4": 0.20485874215808372, "1": 0.121083692370148, "5": 0.09592421752849328}, "score": 2.889484325462332}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3108684955864541, "2": 0.23504511606713555, "4": 0.23433473367592614, "5": 0.12213206740960726, "1": 0.09760944672810369}, "score": 3.0483353491179894}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31284281596332514, "2": 0.24704514148598258, "4": 0.22614425203167934, "5": 0.10897994549118023, "1": 0.10497624421431057}, "score": 2.987106363522764}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2808986642877034, "3": 0.26909828348365505, "4": 0.1811001293222467, "1": 0.1656197633915587, "5": 0.1032708324936851}, "score": 2.775500835832851}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27925609917502286, "2": 0.27574537318779796, "4": 0.18939687459057963, "1": 0.16075069377670076, "5": 0.09483739362253765}, "score": 2.7818219413678498}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2851759844452411, "2": 0.2715019655607268, "4": 0.19607653721116478, "1": 0.14205179988177244, "5": 0.10518228356893534}, "score": 2.8508338341551074}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2884856021995823, "2": 0.2604332209948007, "4": 0.21170406485713114, "1": 0.12953307824448584, "5": 0.10983375220635946}, "score": 2.9118712856909097}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2796523092794058, "3": 0.27052201437392037, "4": 0.17975030240823572, "1": 0.17124337306829204, "5": 0.09881907757539232}, "score": 2.7552462391180366}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "human", "scores": {"2": 0.28505538051335066, "1": 0.263550678821581, "3": 0.23426425638835188, "4": 0.13274602006333863, "5": 0.08436370545700254}, "score": 2.489306500013682}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27658936763161596, "2": 0.25564579649821756, "4": 0.2050183072853711, "1": 0.14847008334369244, "5": 0.11426668734055057}, "score": 2.8809645572448566}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.27222016770886187, "3": 0.24901784958658393, "1": 0.21790639263294753, "4": 0.16022299745506793, "5": 0.10061864505204915}, "score": 2.653422500672387}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2545150268849637, "2": 0.24883170364730428, "4": 0.18896208358517905, "1": 0.1779080028888117, "5": 0.12976912097123328}, "score": 2.8438504203238137}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2799469382560093, "3": 0.25155812571060965, "1": 0.21743898424865624, "4": 0.16061687632824323, "5": 0.0904258591450254}, "score": 2.626638753406451}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2763024997119868, "4": 0.23552448515407792, "2": 0.23180847199894608, "5": 0.14221151320742573, "1": 0.11413923684808112}, "score": 3.059861391546752}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2870326519021197, "2": 0.24673070506939893, "4": 0.22819729391870472, "5": 0.12551251553550924, "1": 0.1125123371269029}, "score": 3.007467053912273}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2961483700716364, "2": 0.25579787426923817, "4": 0.2249744362273329, "5": 0.11493816395190276, "1": 0.10813000778803016}, "score": 2.982792682463966}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28386091406218733, "4": 0.24775133928364276, "2": 0.23759847734376954, "5": 0.1294545790879523, "1": 0.1013172495892782}, "score": 3.0664286794954525}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27866498201069084, "4": 0.24522449055337944, "2": 0.2187642090930523, "5": 0.15551395634118595, "1": 0.10181846563588026}, "score": 3.1338531229429005}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2890814490366032, "2": 0.2632222096295585, "4": 0.20545798880176686, "1": 0.1386247689555139, "5": 0.10360180774841156}, "score": 2.872188351669998}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2978462992091726, "4": 0.26211750064813355, "2": 0.21817475693851576, "5": 0.13695305172824532, "1": 0.08489686603078907}, "score": 3.148056821525305}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29258223690910323, "4": 0.25036483122491604, "2": 0.2263514950693609, "5": 0.13772738756942174, "1": 0.09296536263394134}, "score": 3.113538372288175}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2918431437454787, "2": 0.24200785371119593, "4": 0.23297607805013884, "5": 0.12542564074927426, "1": 0.1077306875432453}, "score": 3.026358568203088}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29251041678622286, "4": 0.2593071014004891, "2": 0.2204353112838128, "5": 0.13648739676662003, "1": 0.09124907714957431}, "score": 3.1293498129556947}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "human", "scores": {"2": 0.29108149484612483, "3": 0.28384118641420375, "4": 0.18487203425001156, "1": 0.15483714373508772, "5": 0.08535587482063188}, "score": 2.7548249942745513}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.299440393879432, "2": 0.267888802665431, "4": 0.21026433536082684, "1": 0.1261532299727129, "5": 0.09624454333930285}, "score": 2.882557138288461}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30327985071775293, "2": 0.2495687626395573, "4": 0.23784558937519512, "5": 0.11063800757140041, "1": 0.09866000820619826}, "score": 3.0122329206563903}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30427018677924667, "4": 0.2570337190921621, "2": 0.23255100538838613, "5": 0.12331881316961464, "1": 0.082818865445387}, "score": 3.105483390797364}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30041440725676083, "2": 0.269710208024371, "4": 0.21921179851821257, "1": 0.10866580671288065, "5": 0.10198963382797059}, "score": 2.936148724613254}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2830034190395618, "3": 0.2532310920107427, "1": 0.22022762685644454, "4": 0.1527274375786145, "5": 0.09078553611056725}, "score": 2.610830151230851}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.279426022337041, "3": 0.24185166386434753, "1": 0.21864525559206363, "4": 0.15612436153380022, "5": 0.10393679551702571}, "score": 2.6472758103244165}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2718990557863947, "3": 0.2613925182619053, "1": 0.19237442034096597, "4": 0.17376961653312353, "5": 0.10054961416660778}, "score": 2.71821678507609}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2599266508196152, "2": 0.2399178274242056, "4": 0.21629877704825898, "5": 0.142108930395825, "1": 0.1417294245494932}, "score": 2.9771395409183015}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2507876283971682, "2": 0.24329990978259095, "4": 0.19530057439757778, "1": 0.17874676419097194, "5": 0.1318468839180302}, "score": 2.858198317703742}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27221665609134843, "2": 0.26622184873480725, "4": 0.18430731949200538, "1": 0.16509389604489286, "5": 0.11214704129951375}, "score": 2.8121892749646884}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.25999353855160884, "2": 0.25540044321738103, "4": 0.1960614987174943, "1": 0.1713565852203877, "5": 0.11717733592722278}, "score": 2.8323007795760837}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2768202501107425, "3": 0.2497759407451036, "1": 0.1985338230839834, "4": 0.16875817600553675, "5": 0.10610041733055015}, "score": 2.7070677770919374}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2585784627867379, "2": 0.24586442816113685, "4": 0.20585299117995912, "1": 0.1586832820656996, "5": 0.13101018640332981}, "score": 2.9046413561814424}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.27691158817663963, "3": 0.2507090187983642, "1": 0.2065779822198004, "4": 0.16616302404219463, "5": 0.09962591076313693}, "score": 2.6753432425345665}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2664970246443768, "3": 0.2638976078821291, "4": 0.19005330377179996, "1": 0.17525570501792584, "5": 0.10428153187577922}, "score": 2.781604694737873}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27450003239993737, "2": 0.24808662486389663, "4": 0.21109525539671145, "1": 0.14605668196202115, "5": 0.1202470382785248}, "score": 2.91138807006946}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27032636248212727, "2": 0.24844517041094594, "4": 0.21058140047821802, "1": 0.14930348984422936, "5": 0.12133403707034626}, "score": 2.90619642966026}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2802497245227558, "2": 0.24986520163424006, "4": 0.21736217662438695, "1": 0.13025143254279084, "5": 0.12226028784702811}, "score": 2.951514143680506}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27899648383001213, "2": 0.24460194597907012, "4": 0.218972637476795, "1": 0.13586651263494184, "5": 0.12154954761848343}, "score": 2.9457360629544116}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3149670968678567, "2": 0.27637995815795013, "4": 0.19460638478094253, "1": 0.12253879564415278, "5": 0.09148824361843481}, "score": 2.8561225139491273}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3033387533840261, "2": 0.2606702188228893, "4": 0.2040738991499149, "1": 0.12741278342784232, "5": 0.1044913172025672}, "score": 2.897559413279204}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32492866924098646, "2": 0.27319028826382, "4": 0.2022120256760182, "1": 0.11183834483579169, "5": 0.0878195972451046}, "score": 2.8809829241478577}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3040445628489557, "2": 0.24617350174615749, "4": 0.22222028818092154, "5": 0.1167386037053163, "1": 0.11080873190137285}, "score": 2.9879063569630606}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31076185490087405, "2": 0.287730270056072, "4": 0.18297936354739913, "1": 0.13485311903517486, "5": 0.08366355671051258}, "score": 2.7928675172737263}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3088357490139, "1": 0.2667270841718504, "3": 0.23619715976377495, "4": 0.12085624470231135, "5": 0.0673724364133796}, "score": 2.413304555297125}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.30411200741232114, "3": 0.24591736847133983, "1": 0.23588060806400252, "4": 0.13663157625908703, "5": 0.07744823509874588}, "score": 2.5156498802712477}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.3155349268368866, "1": 0.26546844409411957, "3": 0.2348607485106289, "4": 0.11869971243375364, "5": 0.06542767139431271}, "score": 2.4030781683134403}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2789463805609245, "3": 0.25372938330146194, "1": 0.2097848913816285, "4": 0.15835847290137575, "5": 0.09917136159203668}, "score": 2.6581817819802627}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.3086545464918851, "3": 0.2502231898481334, "1": 0.2353311989066279, "4": 0.133884003425167, "5": 0.07189705318533339}, "score": 2.49835614496733}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "human", "scores": {"2": 0.29611478875056724, "3": 0.2664678448178029, "1": 0.19407387372595608, "4": 0.16724599942346505, "5": 0.07607960900648447}, "score": 2.635136155908365}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2833041566493606, "4": 0.2544520931008981, "2": 0.20530169474971827, "5": 0.1647793125548775, "1": 0.09214535528398973}, "score": 3.1944216934314813}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27011561714285454, "4": 0.2683726444247769, "2": 0.19828947916650347, "5": 0.1710004484445786, "1": 0.09220965831012364}, "score": 3.227667512259167}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.278910426689747, "4": 0.2587053007630183, "2": 0.20272497935276718, "5": 0.170910611315694, "1": 0.08872444817210476}, "score": 3.2203579877882675}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2694127469641413, "3": 0.2685907858063076, "2": 0.19093805937441688, "5": 0.1848187063610483, "1": 0.08622322552148912}, "score": 3.275670191203359}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30842144604679106, "2": 0.2867383647734724, "4": 0.18438301161591839, "1": 0.13579482121060427, "5": 0.08464773736985307}, "score": 2.7953474873492663}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31815432982931924, "2": 0.2638291353375806, "4": 0.20282646860049888, "1": 0.11001011091552541, "5": 0.10516157521610485}, "score": 2.9292989623718673}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.322370394835298, "2": 0.2560507018528515, "4": 0.21683499638582598, "1": 0.10400563485608594, "5": 0.10072576026557273}, "score": 2.9542239726112483}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3115192016868642, "2": 0.2476547103348901, "4": 0.22508224730381057, "5": 0.11753489626514223, "1": 0.09819639255391527}, "score": 3.0161047465358246}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31080819294785533, "2": 0.25297027178112996, "4": 0.2145559361538137, "1": 0.11595526602136316, "5": 0.105692314420826}, "score": 2.9410586991274643}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28576999642941725, "2": 0.25682301215132525, "4": 0.20721424934320692, "1": 0.13765767384261451, "5": 0.11252169854278132}, "score": 2.900117951200121}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2796515542191901, "2": 0.23408316986501504, "4": 0.22557204072389853, "5": 0.1335466131383112, "1": 0.12712905848126255}, "score": 3.0043240561188527}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2829013864042459, "2": 0.2411849047603198, "4": 0.21921885725176984, "5": 0.1308366605232741, "1": 0.1258474273251884}, "score": 2.988012289855084}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28551862945025175, "2": 0.25748302072099666, "4": 0.20565840802934504, "1": 0.14257746684536965, "5": 0.1087528937687011}, "score": 2.880525096443817}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28765535484813276, "2": 0.2503062026471176, "4": 0.21521021163173062, "1": 0.12980068465944244, "5": 0.11701848092901179}, "score": 2.9393390516149926}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2943412413068552, "4": 0.2770295499402185, "2": 0.20865072442249324, "5": 0.14941716798507876, "1": 0.07054790474432178}, "score": 3.2261203846356237}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29053506624774733, "4": 0.2802689503132952, "2": 0.20076199038373585, "5": 0.16049000700523977, "1": 0.0679343623179258}, "score": 3.264620795943824}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2918197972278523, "4": 0.25509547299331675, "2": 0.22458273716128063, "5": 0.14029656155201828, "1": 0.08819495651270519}, "score": 3.134717357014735}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2853206338597126, "4": 0.2816890714069102, "2": 0.20063139704974223, "5": 0.1642510547540474, "1": 0.0680990919488503}, "score": 3.2733639921705917}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2918511987274044, "4": 0.2759557368108455, "2": 0.20784711366601444, "5": 0.15126060028470753, "1": 0.07307638609863697}, "score": 3.224479063839874}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2734131384685515, "2": 0.2638290298059476, "4": 0.18463996227110982, "1": 0.17243721151310257, "5": 0.10565149336485981}, "score": 2.7872332909177286}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.24885148655410433, "2": 0.23960771829701902, "4": 0.19291471093560453, "1": 0.18098618076422415, "5": 0.1376135065820944}, "score": 2.866558121826822}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2760518689344142, "2": 0.24826158760154393, "4": 0.21599064120311567, "1": 0.13258686015422977, "5": 0.12709572961173446}, "score": 2.956746216700809}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27290861047682974, "2": 0.24293975213087682, "4": 0.22109791970613926, "1": 0.1321848707826078, "5": 0.1308558425837175}, "score": 2.9754997925689484}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2689566943195144, "2": 0.25837207029737036, "4": 0.20364899089388339, "1": 0.15052898830778658, "5": 0.11847562923761824}, "score": 2.881168107813088}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2791316624644014, "2": 0.2467508884665633, "4": 0.20087812461975255, "1": 0.14170197421860833, "5": 0.13152143984600112}, "score": 2.933765113585453}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2751336223147648, "2": 0.24263420475883168, "4": 0.20485425580075622, "1": 0.14003326184282153, "5": 0.13733080893650035}, "score": 2.9568145472685474}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26369430035035507, "2": 0.24613022824840242, "4": 0.1875115566508236, "1": 0.1593759184918397, "5": 0.14326286777813407}, "score": 2.909152944126543}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2637873481121788, "2": 0.2350181579384009, "4": 0.2010807520723293, "1": 0.15115505722452188, "5": 0.1489413760182803}, "score": 2.9616345676682077}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2804654596792323, "2": 0.2535046279257964, "4": 0.20030012745300654, "1": 0.140973366008971, "5": 0.12474217147837054}, "score": 2.9143318899134982}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2825755868821365, "2": 0.2545777980299576, "4": 0.20693041534170448, "1": 0.1433283108726415, "5": 0.11257653247077162}, "score": 2.890847820931896}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27243495244436045, "2": 0.25552165948397265, "4": 0.20710188680983693, "1": 0.1544372984952255, "5": 0.11049078004635933}, "score": 2.863685360714864}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.275206624948136, "2": 0.2506320128165137, "4": 0.2124754769213778, "1": 0.14228706180224376, "5": 0.11938701930167844}, "score": 2.916042388050447}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29159955643230745, "2": 0.23810012511903997, "4": 0.23381440952497126, "5": 0.12367372885860249, "1": 0.11280183187764528}, "score": 3.017458259029183}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.26951066934780754, "2": 0.23035589417911723, "4": 0.22718634390352752, "5": 0.13825275653612315, "1": 0.13468204508947698}, "score": 3.0039719214363663}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29865763353296687, "4": 0.2585958398432997, "2": 0.22093533988059436, "5": 0.1336105037615998, "1": 0.0881894445001753}, "score": 3.1285040626760683}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3037593812593075, "2": 0.25034890852799724, "4": 0.23663800750423772, "5": 0.1060800480059404, "1": 0.10316302242275655}, "score": 2.9921230663928466}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2991309026181578, "2": 0.24879647157255758, "4": 0.2314402819668235, "1": 0.11133066967885266, "5": 0.10929422734174737}, "score": 2.978570766140368}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.294550297794454, "4": 0.25979053689126586, "2": 0.21902274414823428, "5": 0.13914525381501877, "1": 0.08748089957664915}, "score": 3.1440979807853258}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3019324385637202, "2": 0.24187766431571217, "4": 0.2399701832059576, "5": 0.11221120775699439, "1": 0.10399535960696783}, "score": 3.0145244061361396}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2791762712682117, "4": 0.23365189487079527, "2": 0.22454532479380632, "5": 0.14966504726832391, "1": 0.11295393480243084}, "score": 3.0825294162073966}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27766806207939815, "2": 0.25313809731016934, "4": 0.20886812646850425, "1": 0.141543597473702, "5": 0.1187679725179129}, "score": 2.91017750878394}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2774440188556978, "2": 0.233699471239701, "4": 0.22721072230610628, "5": 0.14412314085611988, "1": 0.11751552811021755}, "score": 3.046726809189176}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27742002098598956, "2": 0.2443478632335833, "4": 0.21781841979451377, "5": 0.1320830483584015, "1": 0.12832020978591133}, "score": 2.980996035345538}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27110881698702927, "2": 0.22851911908586292, "4": 0.22613568132694317, "5": 0.14936595655803356, "1": 0.12486209383841466}, "score": 3.046624676166618}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3057194890222978, "3": 0.27505478031720726, "1": 0.19458748941836498, "4": 0.15503544667224817, "5": 0.06958522629846461}, "score": 2.5993043918809504}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3094312636163017, "4": 0.2752159546108587, "2": 0.20749403224293103, "5": 0.14240483883481822, "1": 0.06544548977509582}, "score": 3.2216424869210227}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.33045882877229127, "4": 0.2610681485985616, "2": 0.22557910123926964, "5": 0.11830999771857688, "1": 0.0645746732513417}, "score": 3.1429610187432235}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29564800635459976, "4": 0.27816394747515866, "2": 0.20546115287915775, "5": 0.15404392345422252, "1": 0.06667586737498668}, "score": 3.2474406641923568}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3045899905579831, "4": 0.28089276547769115, "2": 0.19952957660132042, "5": 0.1551577403298876, "1": 0.05982035448122992}, "score": 3.2720405646961073}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2626662931003942, "2": 0.23925436602912775, "4": 0.2061372850249303, "1": 0.14798768768443454, "5": 0.14393693884653386}, "score": 2.958780702895905}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2524421412723353, "2": 0.23434748183218482, "4": 0.20471129695037432, "5": 0.15624312364594312, "1": 0.15223591332341518}, "score": 2.978377802390062}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2528629845490712, "2": 0.22614368667175594, "4": 0.21433940835753287, "5": 0.16187954009544087, "1": 0.14476232780100334}, "score": 3.022430416617814}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2542997982267783, "2": 0.2494097381967248, "4": 0.19107304299182015, "1": 0.1663434253986377, "5": 0.1388587429973418}, "score": 2.886692211800737}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.26437355365634047, "3": 0.2500161157993883, "1": 0.1963132855820191, "4": 0.1734740081068778, "5": 0.11580992608844297}, "score": 2.7480904327357605}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2765676562184409, "2": 0.25091204991483884, "4": 0.2100819891366979, "1": 0.1455986667788707, "5": 0.11683325869737334}, "score": 2.9016384955858654}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2805801654556929, "2": 0.23518185806735936, "4": 0.2342078055051669, "5": 0.1339036992106604, "1": 0.11611873892340899}, "score": 3.0345961355386124}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28373851124801663, "2": 0.25252404678732027, "4": 0.21111450816191638, "1": 0.13417770511860838, "5": 0.11843874167036599}, "score": 2.9271120616530517}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.279980449910151, "2": 0.2423426367168648, "4": 0.2228412599029324, "1": 0.13242857970159583, "5": 0.12240051517092289}, "score": 2.9604422346812598}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28887526298833544, "2": 0.2514967278660355, "4": 0.2185132992862813, "1": 0.12885463119494928, "5": 0.11225404695033518}, "score": 2.933815003722045}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "human", "scores": {"3": 0.24925203641576105, "2": 0.24379226238253385, "4": 0.1971324778222323, "1": 0.17738648425041617, "5": 0.13242623573647921}, "score": 2.863418283840441}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.250170773580656, "3": 0.24901774997946402, "4": 0.19704936458199307, "1": 0.17780379711998012, "5": 0.12594837225583244}, "score": 2.843166181955617}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2660934542862085, "2": 0.22828306657743253, "4": 0.22349266148200383, "5": 0.14669508472767703, "1": 0.1354261913983054}, "score": 3.017747550902075}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2613106629443975, "4": 0.24826618048339857, "2": 0.20521113562080753, "5": 0.17473671913216454, "1": 0.11046539218228198}, "score": 3.1715993992501033}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.24732458394352025, "2": 0.2450827427361845, "4": 0.19632683166605877, "1": 0.17747784406972372, "5": 0.13377758118473407}, "score": 2.863842144885243}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2710702680541478, "3": 0.2661621418705112, "1": 0.200336104586547, "4": 0.16289944017460897, "5": 0.09951538735402987}, "score": 2.6901825767291343}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.27622075389721173, "3": 0.26231185415812697, "1": 0.19231048571016893, "4": 0.1663346925980423, "5": 0.10281297684778856}, "score": 2.7111162526179475}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.26718176083434375, "3": 0.26504641960906555, "1": 0.1878811682082815, "4": 0.17480014259502885, "5": 0.10508187192911034}, "score": 2.7420175610533786}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.3063963970990338, "3": 0.26855125215238523, "1": 0.19384682376764037, "4": 0.15182628098306591, "5": 0.0793714934303943}, "score": 2.616476249915787}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2770959341728977, "3": 0.2552581226787507, "1": 0.21497679218636634, "4": 0.15813494945899742, "5": 0.09451967170079754}, "score": 2.6401195453231434}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.280908861094288, "2": 0.2740375878687281, "1": 0.1768864106777081, "4": 0.17358659456243436, "5": 0.0945665934565332}, "score": 2.7349056735651}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28692615384693515, "2": 0.271160305440049, "4": 0.18054386704791783, "1": 0.16380489893210412, "5": 0.09755321060994815}, "score": 2.7768776047487242}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3007856181652836, "2": 0.28124674468045086, "4": 0.18233447569686567, "1": 0.14484606806633463, "5": 0.0907780103015728}, "score": 2.792949734830803}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28837839202748955, "2": 0.2695303173917655, "4": 0.1899782095457458, "1": 0.1523260332007615, "5": 0.0997754218543151}, "score": 2.815344522660216}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28458906967058933, "2": 0.2651083681957386, "4": 0.1903075559506126, "1": 0.1556658743224466, "5": 0.10431772384628381}, "score": 2.822500861889837}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2821760816184787, "2": 0.2582202438206226, "4": 0.21141228386930136, "1": 0.1407809982466661, "5": 0.10739817388337669}, "score": 2.8864250035990153}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2948553446574686, "2": 0.24954220993584136, "4": 0.2228760481387544, "1": 0.1201049301937248, "5": 0.1126120672315097}, "score": 2.95834772075361}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2943320580033867, "2": 0.2560681394993928, "4": 0.22090922686672998, "1": 0.12660198374538484, "5": 0.10207896485133641}, "score": 2.915794238927535}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2897638204664626, "4": 0.23906715099692386, "2": 0.23384382522789843, "5": 0.1275528360285237, "1": 0.10976191148754494}, "score": 3.040805601505891}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2953579997306903, "2": 0.25578418944903697, "4": 0.22055400355503563, "1": 0.12104094526581753, "5": 0.10725474282577853}, "score": 2.9371968993166413}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27994223518695244, "4": 0.25794997711763784, "2": 0.21445827107122606, "5": 0.15947128568776595, "1": 0.08816993915242285}, "score": 3.186095942184453}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27668574815581115, "4": 0.2483390324676159, "2": 0.21259883348279424, "5": 0.16429805370369166, "1": 0.09806642733358271}, "score": 3.1682054541868347}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28017723329616623, "4": 0.24990208445988685, "2": 0.21502265162687514, "5": 0.15925181299670094, "1": 0.0956350972741989}, "score": 3.162114667049232}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28098831335422547, "4": 0.2750830023854352, "2": 0.19938588725745277, "5": 0.17356118334513693, "1": 0.07097265620452492}, "score": 3.2808766853489773}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27098573442124707, "4": 0.25881522212042574, "2": 0.20326189668330097, "5": 0.17982433882581955, "1": 0.08710228162515614}, "score": 3.240999976682302}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2932615517698069, "3": 0.276322587633903, "1": 0.17683464360178386, "4": 0.16697177380207157, "5": 0.08658864431621963}, "score": 2.6932118426122265}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.29879253777935644, "3": 0.28498207369714335, "1": 0.1730605059941811, "4": 0.15996324642170592, "5": 0.08318465360760302}, "score": 2.6814135934755416}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3032101650152519, "2": 0.2920680663324761, "4": 0.1711590907035368, "1": 0.15043611048124866, "5": 0.08310945541662788}, "score": 2.744433340972152}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.278872999421911, "2": 0.2720323461737771, "4": 0.19438456271717613, "1": 0.15191588491940788, "5": 0.10278477911573496}, "score": 2.824088346502203}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2814441929223517, "2": 0.25909463446094283, "4": 0.20022963421568074, "1": 0.147763183241437, "5": 0.11144648036987313}, "score": 2.8684987174487073}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3237177774609123, "2": 0.3078120837194981, "3": 0.2127147526978375, "4": 0.09910020193094363, "5": 0.05664314528368291}, "score": 2.2571299105129734}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2987821399799645, "1": 0.27071913439158535, "3": 0.23392353278493236, "4": 0.11988276165146623, "5": 0.07667843273852071}, "score": 2.4330112814001423}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.3136099069391271, "1": 0.29669345833716315, "3": 0.22181466236642575, "4": 0.10559093016369354, "5": 0.062282075952575275}, "score": 2.3231521896747926}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.28545559389625036, "3": 0.249796473171304, "1": 0.230907218652184, "4": 0.1421683016948839, "5": 0.09165937670505946}, "score": 2.5782115255203113}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2952007044235584, "1": 0.2649197047111553, "3": 0.23128665662885414, "4": 0.12626267750333547, "5": 0.08231880533607497}, "score": 2.465854057612363}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2806319372720226, "4": 0.24061707729726617, "2": 0.23259747372129458, "5": 0.13656289517041661, "1": 0.10957073023880234}, "score": 3.0620051664925545}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2955699655827573, "2": 0.2561171812437041, "4": 0.21834947575332067, "1": 0.12030123380330782, "5": 0.10964422204880346}, "score": 2.940917212144402}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30037430461030323, "2": 0.2586150542280056, "4": 0.22166806915486045, "1": 0.11285455649182835, "5": 0.10647665710172512}, "score": 2.9502966515954756}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3028628246229175, "2": 0.24926838788567232, "4": 0.2271996574133623, "5": 0.11153949896575749, "1": 0.10911207652655323}, "score": 2.982785812218163}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2867521572205238, "2": 0.24157086791834048, "4": 0.22715871972369298, "1": 0.12235610408284671, "5": 0.1221469440013838}, "score": 2.985169306111276}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29165161159891595, "2": 0.2531295160741234, "4": 0.2096501059498756, "1": 0.13480708803827451, "5": 0.11075061688551881}, "score": 2.9084066344145056}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29282807995721916, "2": 0.2845254995734692, "4": 0.18808821452642316, "1": 0.15030462663935695, "5": 0.08424045583704988}, "score": 2.771431373735635}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2985012376281856, "2": 0.24825384196084338, "4": 0.21409678496718917, "1": 0.1270389559239303, "5": 0.11210079018492591}, "score": 2.9359660743262874}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2987262131982703, "4": 0.24720394371159196, "2": 0.22235850772411503, "5": 0.13983855505122095, "1": 0.0918640051910739}, "score": 3.120795595704069}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3073341152191106, "4": 0.2399059997668677, "2": 0.22981016050242167, "5": 0.12639070959628884, "1": 0.09654828819406523}, "score": 3.069781430594847}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "human", "scores": {"3": 0.33564181983839086, "2": 0.26238316021014063, "4": 0.23740541202356777, "5": 0.08406673762900316, "1": 0.08049552388633766}, "score": 2.9821645482721713}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3186008543290172, "4": 0.2794437943972072, "2": 0.21496105646111285, "5": 0.12507181333069992, "1": 0.061915037292349116}, "score": 3.19079771034713}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.34040162789299777, "2": 0.2702043917195118, "4": 0.22552192418460337, "1": 0.08544725448609262, "5": 0.0784169402773821}, "score": 2.9412564422387497}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3372525914032992, "2": 0.2550644297632723, "4": 0.23539444089595485, "5": 0.09431761588019712, "1": 0.07796211308319964}, "score": 3.013041131605667}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.33501653170551166, "2": 0.26336257079945763, "4": 0.23360372081698855, "5": 0.09240997976980721, "1": 0.07559984092239408}, "score": 3.003861456117173}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3023575565051191, "2": 0.29351480442941735, "4": 0.17778208860168376, "1": 0.1463961171508929, "5": 0.07993695639831669}, "score": 2.7513458602306544}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3182926615807239, "2": 0.26221570825701307, "4": 0.21106589408881207, "1": 0.10894809530824417, "5": 0.09946323505828981}, "score": 2.9298794551958736}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3210568720659918, "2": 0.27158809964434616, "4": 0.20310808565233202, "1": 0.11391070807477047, "5": 0.09032502727349632}, "score": 2.8843473282525145}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3132649377469187, "2": 0.2552924572051961, "4": 0.22354326594877283, "1": 0.10424775013238942, "5": 0.10364089372144533}, "score": 2.967036743371574}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2970898680269519, "2": 0.263085580130406, "4": 0.20391425339397257, "1": 0.1290838610726799, "5": 0.10681586658078591}, "score": 2.896291587999394}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3284255838175236, "2": 0.29953437301958724, "4": 0.1899357161733313, "1": 0.1217221853748218, "5": 0.06037039157158235}, "score": 2.767695025953796}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3423291081861321, "2": 0.2953217910595602, "4": 0.2020857230634208, "1": 0.0929161319212595, "5": 0.0673314864220991}, "score": 2.855592365235438}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.33017852036187506, "2": 0.25131166924383525, "4": 0.23910583519142206, "5": 0.09261263495867872, "1": 0.08678275084914233}, "score": 2.9994539294762443}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3384838494094924, "4": 0.25564725368341057, "2": 0.23728802034013732, "5": 0.09875273296390694, "1": 0.06981825293731053}, "score": 3.076228947351504}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.33644745286371247, "2": 0.2798791992936963, "4": 0.22501840052734395, "1": 0.08869938705554553, "5": 0.06994771811927186}, "score": 2.90763513902289}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2927740581601311, "2": 0.26459318063179627, "4": 0.19864302685612256, "1": 0.14054929466980956, "5": 0.10342880265909497}, "score": 2.8598072307764113}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2842090556995702, "2": 0.24745646782974706, "4": 0.21243160526529795, "1": 0.13262074042501942, "5": 0.12327166507074964}, "score": 2.9462764244716704}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29357104725383654, "2": 0.25361862923208517, "4": 0.21722052439800527, "1": 0.12087607883941345, "5": 0.11470387174627406}, "score": 2.951257000932734}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29739302455174393, "2": 0.2455075938614715, "4": 0.22376714479065402, "5": 0.1184376638827207, "1": 0.11488286901243853}, "score": 2.9853689694296146}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30647272994841285, "2": 0.2586993506095278, "4": 0.21244704960439564, "1": 0.11480611844013781, "5": 0.1075639956680775}, "score": 2.939262800177859}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28602850651498574, "2": 0.2791522910564746, "4": 0.18040279105378257, "1": 0.15788073069993194, "5": 0.09652013881760638}, "score": 2.7785258741134147}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2974274051725437, "3": 0.29277098404865953, "4": 0.1719586049550623, "1": 0.15588296151612477, "5": 0.08194690839559647}, "score": 2.726655502912199}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30788452042464143, "2": 0.28359920147545725, "4": 0.19120376254037685, "1": 0.13606277756606477, "5": 0.08123579531082452}, "score": 2.797947779404452}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29153911410932226, "2": 0.2897297462447792, "4": 0.18295449834152203, "1": 0.15031325437253962, "5": 0.0854530394610405}, "score": 2.7635018751163036}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2919975112110521, "2": 0.26720073141281053, "4": 0.19888245642575103, "1": 0.13683587007686798, "5": 0.10507249904417112}, "score": 2.8681535416245643}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2638217218430377, "2": 0.24487355590718932, "4": 0.2021321879120828, "1": 0.15861815594646217, "5": 0.13054018089920244}, "score": 2.9011012777965544}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2741653739768199, "2": 0.23367827565889365, "4": 0.22141564439056247, "5": 0.14305379938492946, "1": 0.12767469440366896}, "score": 3.018495804568379}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27430797704487214, "2": 0.24859823492277996, "4": 0.20605311574626273, "1": 0.14505253381568653, "5": 0.12597768385232833}, "score": 2.9193043372544327}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2715710716043331, "2": 0.23977128240571152, "4": 0.21367799359277453, "1": 0.14060947670390295, "5": 0.13435872549906852}, "score": 2.961404766854479}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2681408169725353, "2": 0.23973215492531216, "4": 0.21386326858714247, "1": 0.14436639517525135, "5": 0.13388709618136735}, "score": 2.9531720348370984}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "human", "scores": {"2": 0.26962696133294184, "3": 0.26491520111445593, "1": 0.18602245253506444, "4": 0.17794828582052155, "5": 0.10147332732598292}, "score": 2.739219482633763}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.28632129202889184, "3": 0.267432628618181, "1": 0.18863921567293246, "4": 0.16845030474815262, "5": 0.08914475231055184}, "score": 2.683136344905323}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.271938538395663, "2": 0.2627126052501639, "4": 0.18839866553735846, "1": 0.16728358382198458, "5": 0.10965451812464704}, "score": 2.810425637152657}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27191860603132867, "2": 0.25898249666766127, "4": 0.19803923724821357, "1": 0.15631271420209006, "5": 0.11473289549717557}, "score": 2.85589507844563}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.27245386008614764, "3": 0.26803856756514344, "1": 0.18682472521159954, "4": 0.17574341798546161, "5": 0.09692782980789062}, "score": 2.723492559787046}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27993361309888953, "2": 0.2679672251945484, "4": 0.1944847548946418, "1": 0.15371489862289556, "5": 0.10388754115015778}, "score": 2.8268607427903976}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28449261032675355, "2": 0.26816342219620287, "4": 0.1964884162091584, "1": 0.14550650288523442, "5": 0.105336867753968}, "score": 2.847983872098415}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2797856233362246, "2": 0.2776776973283229, "4": 0.18166142983478697, "1": 0.16009503040974382, "5": 0.10076575633109185}, "score": 2.7853220795139553}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27885055104901674, "2": 0.26270285879330696, "4": 0.19627483157606646, "1": 0.1485615096651333, "5": 0.11359971289852458}, "score": 2.8636469426312816}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2798550747465002, "2": 0.2740263525579509, "4": 0.186093284764804, "1": 0.15712435768558275, "5": 0.10288953932077101}, "score": 2.803595058243388}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2834587128800501, "4": 0.23232333319926557, "2": 0.2180524170307835, "5": 0.14622826782208084, "1": 0.11991345556710256}, "score": 3.066902133852451}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.26893617370660916, "4": 0.2396616840314931, "2": 0.19889051132834693, "5": 0.18226066341196148, "1": 0.11021866750634579}, "score": 3.1848611355318734}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28056905470113525, "4": 0.26544548206682744, "5": 0.19142819528950397, "2": 0.18625125192501724, "1": 0.07628980247629084}, "score": 3.3094760334706637}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2793014540482449, "3": 0.2646118880309657, "5": 0.20310371887543355, "2": 0.17719279533820576, "1": 0.07576804842018751}, "score": 3.35678788295119}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27517866537541164, "4": 0.25543821973643765, "5": 0.19426413992051764, "2": 0.18796648562423604, "1": 0.08712839009111738}, "score": 3.2817500237359036}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29623625032942824, "2": 0.2784522468072063, "4": 0.2022156453036734, "1": 0.14165259968460542, "5": 0.08143133737683937}, "score": 2.803318529339808}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30618695485916025, "4": 0.2725444660570342, "2": 0.21632704914596054, "5": 0.12826809670158026, "1": 0.07666311391806069}, "score": 3.1594290276769805}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29674627447324387, "4": 0.2698799630866021, "2": 0.21087741202650698, "5": 0.14406341419344096, "1": 0.07842159053981945}, "score": 3.1902883573182215}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2809985696148385, "4": 0.2563640434305361, "2": 0.2231837178135282, "5": 0.13560318710877808, "1": 0.10384114494888906}, "score": 3.0967053128823605}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2992334323459504, "4": 0.24360612494746173, "2": 0.23806150841064536, "5": 0.11874995678301, "1": 0.10033948424630339}, "score": 3.0423659638016196}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2933585200667983, "2": 0.2762647869947276, "4": 0.18181583496758727, "1": 0.16155650844936495, "5": 0.08699209730744158}, "score": 2.756419241285411}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29849864067871495, "2": 0.263882249488284, "4": 0.195568006638992, "1": 0.14474178748405836, "5": 0.09729466711273395}, "score": 2.8367891255976985}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29622505281080025, "2": 0.24608745453187647, "4": 0.220678916591392, "1": 0.11917663007383741, "5": 0.11782053524435016}, "score": 2.9718789515183506}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29369281641422296, "2": 0.25481601602973675, "4": 0.22226720383552964, "5": 0.11514673585644829, "1": 0.11406559515135112}, "score": 2.9696131157340924}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3020198908604096, "2": 0.27058483687906865, "4": 0.20123198142172682, "1": 0.13461591897572978, "5": 0.09153658962701215}, "score": 2.8444868090652893}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27070316243383363, "2": 0.2635501517207504, "4": 0.19500583456887202, "1": 0.15672476519824524, "5": 0.11400522480671818}, "score": 2.8460149295913992}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27536841141791557, "4": 0.2337386893012783, "2": 0.22966108506202923, "5": 0.14472171319031873, "1": 0.11649871920328903}, "score": 3.0605242810900943}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2694275381299634, "2": 0.2316703784795324, "4": 0.2229606010582609, "5": 0.14285572130068913, "1": 0.13307366924644912}, "score": 3.0108544579369814}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28103052096860376, "2": 0.24049463436929056, "4": 0.22037227579928959, "5": 0.1313688846078448, "1": 0.12671702856691705}, "score": 2.9891811733168523}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.260362418828003, "4": 0.2267268477365866, "2": 0.22243487874782178, "5": 0.15676418643370518, "1": 0.13369628250636878}, "score": 3.0504285527244175}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3059277243080308, "2": 0.2588068625237595, "4": 0.22695970233796575, "1": 0.1068328089207177, "5": 0.10146744204367283}, "score": 2.957421873589258}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2938337934215474, "4": 0.2535940040587582, "2": 0.22114178988518682, "5": 0.13734359502999574, "1": 0.09407986780187055}, "score": 3.1189804955207836}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29351958875972173, "4": 0.2487920181555746, "2": 0.23228614121091848, "5": 0.12807788801582728, "1": 0.09731691121604008}, "score": 3.078028412062045}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3069080769029744, "4": 0.28143817008106775, "2": 0.2037791438070863, "5": 0.14445777914095556, "1": 0.06340936598371286}, "score": 3.2397576421596965}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3037278830446816, "4": 0.2871192914297108, "2": 0.19830597753749285, "5": 0.14608728404234816, "1": 0.06475230374254273}, "score": 3.2514851003247647}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2796606710084605, "2": 0.27679503293461727, "1": 0.17920008573670274, "4": 0.1704553147817355, "5": 0.093874921980317}, "score": 2.723006083743746}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.3034650595958737, "3": 0.29456858993591223, "1": 0.16601797721721306, "4": 0.16092333621201932, "5": 0.07501337860154163}, "score": 2.675445295584086}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.31821955815260894, "3": 0.2950187397746773, "1": 0.17074864775606335, "4": 0.14978909614013514, "5": 0.06621214325539322}, "score": 2.6224920687597555}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2997529630657304, "2": 0.27106934641680325, "4": 0.19524429688201594, "1": 0.1371335514346647, "5": 0.09678428915401169}, "score": 2.843473991447574}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30257027936983627, "2": 0.30118894105961375, "4": 0.17014402410263632, "1": 0.1499729701685474, "5": 0.07611096026331059}, "score": 2.721227487965031}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29269736140460684, "2": 0.23283894211216496, "4": 0.22542702198028405, "1": 0.12511031636015535, "5": 0.12391032010377481}, "score": 2.990187929988996}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.290531754166871, "2": 0.24506887144550688, "4": 0.2185749287260226, "1": 0.12405468531361767, "5": 0.12175692984432773}, "score": 2.968910147443469}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.299383715177679, "2": 0.2422657293698125, "4": 0.23181313139606002, "5": 0.11879463892093496, "1": 0.10773303609783294}, "score": 3.0116707214507543}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2856701372670703, "4": 0.2340942656702351, "2": 0.2317667038757128, "5": 0.14040346615240082, "1": 0.10805674210129759}, "score": 3.067021591974784}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2880078621750167, "2": 0.23072928087225447, "4": 0.22669381604128885, "5": 0.1310664804705086, "1": 0.12348045432674887}, "score": 3.01113683364867}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27528834592596196, "4": 0.2468115966519267, "2": 0.21506606908308332, "5": 0.15542300728191993, "1": 0.10740221213063329}, "score": 3.1277882384370836}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29412600941949946, "4": 0.24963672946688764, "2": 0.22535255319514252, "5": 0.13593784768767064, "1": 0.09493973092703145}, "score": 3.1062811675037514}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28018832853428904, "4": 0.2621598884749518, "2": 0.2102852787315913, "5": 0.15252298087890695, "1": 0.09483471924574638}, "score": 3.167252605524119}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2951501703887979, "3": 0.28931118657938815, "2": 0.18789069402498704, "5": 0.16885513854681025, "1": 0.058785873472960395}, "score": 3.327400277682999}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2887868518023571, "4": 0.26099772191305676, "2": 0.21632064596007344, "5": 0.1465858375891669, "1": 0.0873033014111464}, "score": 3.163243069216101}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2609870734232334, "4": 0.26073482090698125, "2": 0.1961410373907266, "5": 0.18870940251510604, "1": 0.0934115107412429}, "score": 3.255193689723834}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3060194551895504, "3": 0.25261888737209426, "5": 0.23729402380299544, "2": 0.15406655416876322, "1": 0.04998718532014038}, "score": 3.526573894281304}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.27809730737714616, "3": 0.2654149575915807, "5": 0.20662297980438693, "2": 0.18142551412614757, "1": 0.06842890198224272}, "score": 3.3730638060461837}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.27617460126539534, "3": 0.2653702124018562, "5": 0.19662348945462887, "2": 0.18752464541427033, "1": 0.07429411026875153}, "score": 3.3333130276918}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2778897852044771, "3": 0.26407661753639794, "5": 0.19585431244322501, "2": 0.18648952643512776, "1": 0.07567942137098278}, "score": 3.331753470252703}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26728550092854914, "2": 0.2350047387847031, "4": 0.22583853092391235, "5": 0.13795099025263843, "1": 0.1339039536279306}, "score": 2.998927847928111}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2798875118293559, "4": 0.24202617439915117, "2": 0.228799020618318, "5": 0.13540491761473616, "1": 0.11386439000921351}, "score": 3.0563092217430317}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2699153196775726, "4": 0.23602501117898375, "2": 0.2312167492395895, "5": 0.1421136200679072, "1": 0.12071175082302042}, "score": 3.047612835987442}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27172479716629927, "2": 0.2393256505220659, "4": 0.2289584117498269, "5": 0.13307119409922005, "1": 0.12690574924105336}, "score": 3.001963678822878}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27066023231671993, "4": 0.24272564655373713, "2": 0.23371879898516373, "5": 0.13755482693586116, "1": 0.1153281656614468}, "score": 3.0534608292652132}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28876516472414665, "2": 0.25547288505484456, "4": 0.21667769631218387, "1": 0.13052484332904668, "5": 0.10854707816183236}, "score": 2.9172482603938716}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2823700031909836, "2": 0.24660621150114495, "4": 0.2320918686818135, "1": 0.12107601590739821, "5": 0.11784704784733611}, "score": 2.979027535394014}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2825711222231347, "4": 0.2513747563899211, "2": 0.22395462827216556, "5": 0.1418920388977419, "1": 0.10019998901120415}, "score": 3.110805055073374}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28919230411372415, "4": 0.25592347627220624, "2": 0.22851482296680772, "5": 0.13162131567406274, "1": 0.09474018772621998}, "score": 3.101171707774361}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28902019916720517, "2": 0.25193070737908746, "4": 0.22452358985835413, "1": 0.1223118925763316, "5": 0.11220373473941204}, "score": 2.95237609645844}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30641113512018087, "2": 0.2599882347375215, "4": 0.21875672748503755, "1": 0.11294446965928942, "5": 0.10189269798061641}, "score": 2.936664522824632}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2931527425987355, "2": 0.25027714378388993, "4": 0.21639570060963326, "1": 0.1222842165267047, "5": 0.11787895336140485}, "score": 2.9573075504988267}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3063780445045133, "2": 0.25811676988446125, "4": 0.22069350394988554, "1": 0.10913790641191344, "5": 0.10566736341097381}, "score": 2.9556353636046726}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29698783518242894, "2": 0.24049018525970914, "4": 0.23832166123372678, "5": 0.12634784513781694, "1": 0.09784582044021933}, "score": 3.0548358901784676}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30540518762880753, "4": 0.2419504804509498, "2": 0.23283645074881318, "5": 0.12738737985164753, "1": 0.09241266893934572}, "score": 3.0790640707866213}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2864265917261338, "3": 0.28535835574087026, "1": 0.17115419562354264, "4": 0.16997003876895073, "5": 0.08707820117356263}, "score": 2.7153878672009863}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2944125982718628, "2": 0.29382021861387186, "1": 0.16569066382190004, "4": 0.1640911028846067, "5": 0.08197043053357135}, "score": 2.7028259642813666}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2942742274360284, "2": 0.28462202699304934, "4": 0.18250969209497706, "1": 0.14950599299975104, "5": 0.08907816823053555}, "score": 2.777029809887602}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29029942170891176, "2": 0.2635976740971192, "4": 0.20074576947024658, "1": 0.1387118803942099, "5": 0.10663337819342888}, "score": 2.872989582578564}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.28075280340482284, "3": 0.27864129649386865, "1": 0.18013233567919448, "4": 0.16986931038881012, "5": 0.09059090113047412}, "score": 2.710029765942188}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2762627150165951, "2": 0.24387309291443407, "4": 0.21571905267052832, "1": 0.13809837299367184, "5": 0.1260370207134219}, "score": 2.947722745717609}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2763005103411506, "2": 0.2427906329073549, "4": 0.21663674809730907, "1": 0.13443201129163856, "5": 0.12982910113938462}, "score": 2.964639906057962}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27070827877195286, "2": 0.23697998331507844, "4": 0.22309943724069814, "5": 0.13801684997645877, "1": 0.13118465082227132}, "score": 2.9997838498996003}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27800432718471385, "4": 0.23673618531041982, "2": 0.23067245924824592, "5": 0.14279463497293118, "1": 0.11178362454097741}, "score": 3.0680863439577135}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2762272727839263, "2": 0.246236136251773, "4": 0.21252118531222483, "1": 0.14131819909881027, "5": 0.12368617106155799}, "score": 2.9310202317602867}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2941829871456386, "2": 0.24349304487721837, "4": 0.22911298793778415, "5": 0.1196335450243074, "1": 0.11356767093924675}, "score": 2.997751669277816}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28931474512886807, "4": 0.2406362071153115, "2": 0.2374605677068654, "5": 0.12383748225198088, "1": 0.10874329131213605}, "score": 3.033364278409442}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29445641012600665, "4": 0.2339578518844363, "2": 0.23360245936030205, "5": 0.13607653420826324, "1": 0.10189718135796112}, "score": 3.0687147553482754}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3048475083578234, "4": 0.26527169873218603, "2": 0.21113310816940373, "5": 0.15018169769093134, "1": 0.06855914332707774}, "score": 3.2173851870144023}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29144825552849984, "4": 0.2504608645509041, "2": 0.22914859486269612, "5": 0.12656718564327152, "1": 0.10236496127303435}, "score": 3.0697174252338106}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "human", "scores": {"2": 0.32557409787471897, "3": 0.2859884367281771, "1": 0.20404822826813415, "4": 0.13019791020360985, "5": 0.05417950925740119}, "score": 2.5048805231498474}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2991723052000727, "3": 0.2955814043617643, "1": 0.1757975201354113, "4": 0.15376443354287891, "5": 0.07567016634370559}, "score": 2.654332522507383}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.33118494944518373, "3": 0.27813240547198037, "1": 0.2196832813764236, "4": 0.11695075853454033, "5": 0.054036312754502484}, "score": 2.454465165903644}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.295543513254597, "3": 0.2912024934571526, "1": 0.1755528573396025, "4": 0.15772725055074843, "5": 0.0799624603550726}, "score": 2.670999184478684}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.3268750144357645, "3": 0.256271230815148, "1": 0.252612066754214, "4": 0.11164143685110305, "5": 0.052591945412702235}, "score": 2.3847210693909853}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30286518696216264, "4": 0.26702077890386666, "2": 0.2255593413754958, "5": 0.12752893486666073, "1": 0.07701676912462282}, "score": 3.1424870497953643}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29848010448868345, "4": 0.2819142591056335, "2": 0.1959063970292425, "5": 0.1627712399180125, "1": 0.06091742624255909}, "score": 3.289718552684096}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30973539825615315, "4": 0.27030908917945257, "2": 0.2131809379346173, "5": 0.13259498797787247, "1": 0.07416980146450702}, "score": 3.173980226700688}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3121621233530476, "4": 0.28471408864214515, "2": 0.20476739553089324, "5": 0.14082706932610994, "1": 0.05751818041632967}, "score": 3.246567218363117}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2993734764297035, "4": 0.27944303989998087, "2": 0.20660285570621348, "5": 0.14420371379355434, "1": 0.07036955265959081}, "score": 3.220510129749431}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30428135370001314, "2": 0.29790411678686346, "4": 0.18378525414487396, "1": 0.1284340160890772, "5": 0.0855814435750559}, "score": 2.8001732315824617}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2952811871048754, "2": 0.2898738646796655, "4": 0.18382363251250156, "1": 0.13751010137891134, "5": 0.09349567504131212}, "score": 2.8059178992610008}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2976534168578836, "2": 0.2910029716520705, "4": 0.1863730068972543, "1": 0.13327662813377053, "5": 0.09167667446143572}, "score": 2.8121668780122913}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30441070075963894, "2": 0.29725411498247545, "4": 0.1855689440402807, "1": 0.12087968100023481, "5": 0.0918737984159969}, "score": 2.830300898392801}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2970990185358043, "2": 0.27926696244857, "4": 0.19378121772224466, "1": 0.13191234895828585, "5": 0.09792876033640338}, "score": 2.846545283837569}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29063775948498555, "2": 0.27432556074975245, "4": 0.20402015316353597, "1": 0.1339917162462417, "5": 0.09701334816477503}, "score": 2.855736202671693}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28910414282107194, "2": 0.27353458820926424, "4": 0.1977197608663814, "1": 0.14651978623795556, "5": 0.09311198224749702}, "score": 2.817367785908231}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2963126002484027, "2": 0.2700206611861026, "4": 0.2148895078353465, "1": 0.12247561867881977, "5": 0.09629113697302888}, "score": 2.8924987571537257}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29948303722765474, "2": 0.25168303016293264, "4": 0.23751549868869917, "5": 0.11143258386023637, "1": 0.09987838331251221}, "score": 3.008940936380934}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29368139198587107, "2": 0.2436330205482658, "4": 0.22967798873993753, "5": 0.11948377391117793, "1": 0.11350969808819354}, "score": 2.9979930914865927}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30018999143363406, "2": 0.26326556589777517, "4": 0.20108877535440045, "1": 0.13502008956803277, "5": 0.10041057987854086}, "score": 2.868600905380469}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30336311246392683, "2": 0.2422947787722408, "4": 0.22191893976100613, "1": 0.11732957779422276, "5": 0.11508085623277002}, "score": 2.9751264011011793}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31070346823393735, "4": 0.24406331491338892, "2": 0.22397792076469447, "5": 0.12788096611025807, "1": 0.09336273464816829}, "score": 3.08912289048216}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.283572657832461, "4": 0.25187629622290997, "2": 0.21111427593608512, "5": 0.1566756866878811, "1": 0.09674702469998964}, "score": 3.1606216023807874}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2965863416704358, "2": 0.2537713282351749, "4": 0.2137600830743892, "1": 0.12700618410104883, "5": 0.10886231068427958}, "score": 2.923699958709603}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3024928312920945, "4": 0.24548066315560113, "2": 0.23820865207204484, "5": 0.1199564642432637, "1": 0.09385136233175952}, "score": 3.0594828113350774}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2898091140912061, "4": 0.24316418630330458, "2": 0.22943110284973292, "5": 0.13906917608105993, "1": 0.09851536038175046}, "score": 3.0948417638298817}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3101696726825563, "2": 0.2446620031285215, "4": 0.2440612403840289, "5": 0.1136422071370759, "1": 0.0874573528880096}, "score": 3.0517693352547193}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28120922886707084, "4": 0.25971416969994704, "2": 0.21131735992938183, "5": 0.1607909025531122, "1": 0.08696000314527222}, "score": 3.196060242906241}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29393145061594567, "4": 0.25574641291412115, "2": 0.21906298232209742, "5": 0.1442727029272979, "1": 0.08697385697720167}, "score": 3.151283027787481}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29586310936234844, "2": 0.26749048055221225, "4": 0.1955211150535258, "1": 0.14535717348690502, "5": 0.09575727257689826}, "score": 2.8288289756523155}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30941415254054927, "2": 0.24413822943978192, "4": 0.23481366365096742, "5": 0.11175969422879452, "1": 0.09986804643478203}, "score": 3.0144588196420523}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3028617343187114, "4": 0.23970767952178493, "2": 0.23599496710740642, "5": 0.12277421019794252, "1": 0.09865148434972516}, "score": 3.0519586797749607}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29191707697703795, "2": 0.23321873242707888, "4": 0.23319338292863426, "5": 0.1365955922412036, "1": 0.10506819116002256}, "score": 3.06302989540267}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28515781931359757, "2": 0.26396995213077595, "4": 0.1978873202355624, "1": 0.14628023195651982, "5": 0.10669458198352441}, "score": 2.8547446018956073}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2725516885810827, "3": 0.2597137281862338, "1": 0.20829573629161605, "4": 0.16070937008571887, "5": 0.09869699290777405}, "score": 2.6689494409079466}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2655442196007145, "2": 0.2620888789798343, "1": 0.20541595639731963, "4": 0.16400132039521728, "5": 0.10290439764299397}, "score": 2.6968756145050223}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2665503293796015, "2": 0.2524639532156036, "4": 0.1909132390400549, "1": 0.17704339623326854, "5": 0.11300668530823736}, "score": 2.810371616901013}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26197764586160704, "2": 0.2555046167576663, "1": 0.20031771457626035, "4": 0.17275912426271323, "5": 0.10940616912990551}, "score": 2.735422227981927}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.26619735745134, "2": 0.25918219733084086, "1": 0.1979841503953476, "4": 0.17251430817646948, "5": 0.10409893853531405}, "score": 2.7255553616951596}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3004134759735418, "2": 0.2396599345075855, "4": 0.23092753938152438, "5": 0.11939871980288519, "1": 0.1095929753548437}, "score": 3.0108791737861234}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3200504946037718, "2": 0.2777471809802368, "4": 0.20596333736255118, "1": 0.1161354612257908, "5": 0.08009484372108641}, "score": 2.856133672310118}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3082104962675546, "2": 0.24022648815495698, "4": 0.23602850437499878, "5": 0.1090289647938317, "1": 0.10649843380469437}, "score": 3.000863084337093}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2975412226696615, "4": 0.2546427491103931, "2": 0.2171467036883027, "5": 0.13838692677200756, "1": 0.09227317574737977}, "score": 3.129724743794523}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2859172058807585, "2": 0.23790831752745675, "4": 0.22773534312892363, "5": 0.12454707775175226, "1": 0.1238837070253635}, "score": 2.991153693199209}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27876501282218985, "2": 0.24771043891394545, "4": 0.20537169402815758, "1": 0.14338158157004435, "5": 0.1247613333475035}, "score": 2.92041996769787}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28535769941740685, "2": 0.24042732934090874, "4": 0.21805270049910988, "5": 0.13100687188754262, "1": 0.12514885627243608}, "score": 2.989341332653203}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2917600094768645, "2": 0.24018711825999942, "4": 0.22129522703650392, "5": 0.12921559378323522, "1": 0.11753595408396879}, "score": 3.004467415414475}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28835419809534807, "2": 0.23500424527526986, "4": 0.22326231463672905, "5": 0.13559609524754607, "1": 0.11777671415646694}, "score": 3.023896985263093}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27796410286886963, "2": 0.23653629868868803, "4": 0.21859973838835473, "1": 0.13350300393623055, "5": 0.13339024154672358}, "score": 2.981837794785454}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "human", "scores": {"3": 0.291135786607463, "2": 0.27137770040735704, "4": 0.20528861744827923, "1": 0.13409314614908915, "5": 0.09809303636467018}, "score": 2.861909080009943}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2936203126088134, "2": 0.2723874984090111, "4": 0.20772958857775292, "1": 0.12950906503787238, "5": 0.09674172310830101}, "score": 2.869805868422894}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3017369402422284, "2": 0.27451773822303377, "4": 0.21918713857802688, "1": 0.10971586505070283, "5": 0.09483478563007311}, "score": 2.9149066005667685}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29670562301832926, "4": 0.252575617462861, "2": 0.2318652720323058, "5": 0.12897002061016047, "1": 0.0898732710859454}, "score": 3.0989048528921352}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3100575356045198, "2": 0.2510999027787687, "4": 0.2417380202906631, "5": 0.10794442150634542, "1": 0.08914986936619254}, "score": 3.028227511136991}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3045965697728344, "2": 0.25219116191968655, "4": 0.23366617143771654, "5": 0.10889060767586121, "1": 0.10064494013930478}, "score": 2.9979663231377742}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29120622087292425, "4": 0.25494733106504386, "2": 0.22411479067914836, "5": 0.143892440424853, "1": 0.08582922609600895}, "score": 3.1469604373050357}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.294725283173079, "4": 0.2521741143733543, "2": 0.2392605867235132, "5": 0.1238642340372361, "1": 0.08996554637508684}, "score": 3.0807117290843316}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29824785797741826, "4": 0.2638059193951873, "2": 0.22430976566395958, "5": 0.1327403253812297, "1": 0.08088571876351935}, "score": 3.1432068581536976}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30044613269324066, "4": 0.2491337196394963, "2": 0.23411716120899126, "5": 0.12910473562067704, "1": 0.08718318493292132}, "score": 3.0988611492386666}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3184671019135693, "2": 0.2732360787932723, "4": 0.20875666241499793, "1": 0.11244706515816155, "5": 0.08708531575322512}, "score": 2.8847961889908467}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3208266605468909, "2": 0.27290858318597, "4": 0.21291388304053888, "1": 0.10842828416282936, "5": 0.08491484059986878}, "score": 2.892977583469317}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31177247624625204, "2": 0.25740334205699283, "4": 0.23372826478820388, "5": 0.10225058119670763, "1": 0.09483836096888608}, "score": 2.991149301455507}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31112211224274094, "4": 0.26037257316034546, "2": 0.2322720186428633, "5": 0.11940341226477973, "1": 0.07682328459108315}, "score": 3.1132615572890128}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30500427075419156, "4": 0.24270258871257927, "2": 0.24166142564909496, "5": 0.11689662286671304, "1": 0.09372577945409721}, "score": 3.047383291148615}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29965918503592504, "4": 0.2856173788651054, "2": 0.1951928958258929, "5": 0.16176658760146057, "1": 0.057756267923379914}, "score": 3.2984474158886266}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.31690085952436514, "3": 0.2750379749835381, "5": 0.208400243641192, "2": 0.15508836930093026, "1": 0.04456392962392129}, "score": 3.489489339088351}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.2941153328391386, "3": 0.2922442949352911, "2": 0.18686160805257296, "5": 0.17378956643020377, "1": 0.05297725015178841}, "score": 3.348882525649122}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.33635030086874873, "3": 0.2614427365879792, "5": 0.23182122181552273, "2": 0.13742866451883404, "1": 0.03294892973659004}, "score": 3.5966710812722313}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.32104091593596323, "3": 0.27828324975241625, "5": 0.20495420808311557, "2": 0.15553213698532017, "1": 0.04018206609245947}, "score": 3.495056737812738}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.263460032980045, "2": 0.24830918390984755, "4": 0.19810343216723042, "1": 0.16450187675447459, "5": 0.1256057808665047}, "score": 2.871999535727097}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27401602195919256, "2": 0.25768687343747554, "4": 0.19593690203001263, "1": 0.1530750584162047, "5": 0.11926821673499267}, "score": 2.870634155399854}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2672377412769852, "2": 0.2560923390819878, "4": 0.19144904295510576, "1": 0.16938942922168143, "5": 0.11581424587924964}, "score": 2.828203382014129}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2805546899332757, "2": 0.23566296714232057, "4": 0.22782283307558807, "5": 0.1347408196864955, "1": 0.12120736983210742}, "score": 3.0192269832978433}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2724941862415023, "2": 0.2599240255736995, "4": 0.1940701863573854, "1": 0.16199127552239592, "5": 0.11150381203630166}, "score": 2.833168478710925}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27089158323825113, "4": 0.23238079386428415, "2": 0.22104088380080322, "5": 0.14905767014014, "1": 0.12661706293959712}, "score": 3.056221799464443}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28567107998007873, "4": 0.23492118595616462, "2": 0.22893189990081192, "5": 0.14018236456356054, "1": 0.11028421198534424}, "score": 3.0657862002350362}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2755451995896195, "2": 0.2445743808930801, "4": 0.2133797578605296, "1": 0.14173439933960194, "5": 0.12475351105713398}, "score": 2.9348427695657255}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27292564050545487, "4": 0.24558167467706862, "2": 0.21350427993082152, "5": 0.15859937666855328, "1": 0.10937811004625503}, "score": 3.1305213530454052}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2829351951399529, "4": 0.26119458840471976, "2": 0.20574690131001916, "5": 0.15908869533450776, "1": 0.09102489849995785}, "score": 3.191577143144759}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2997077637270159, "4": 0.2664166879028188, "2": 0.21752593373460294, "5": 0.14277186104492207, "1": 0.07356557453255128}, "score": 3.1873056083988427}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2956766264668059, "4": 0.27640425302401594, "2": 0.20561355882153776, "5": 0.15666738309653375, "1": 0.06562785199783738}, "score": 3.2528723677099607}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29935512539806325, "4": 0.24546627841021737, "2": 0.235274632086015, "5": 0.13106747657954537, "1": 0.08882705517446626}, "score": 3.0946733821269965}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29002188306606297, "4": 0.2623895099594494, "2": 0.21615005789978323, "5": 0.1528357444439467, "1": 0.07859045693176588}, "score": 3.194732431581477}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28720658896285817, "4": 0.24995811878843627, "2": 0.23010319425675313, "5": 0.14126850622719092, "1": 0.09145317374915503}, "score": 3.1194868343034594}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27618664274051274, "2": 0.24538558236503294, "4": 0.21754807900183212, "1": 0.14344726537484656, "5": 0.1174217646416585}, "score": 2.920110643080439}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.306305380250678, "2": 0.24362174060054723, "4": 0.23687104496559597, "5": 0.11027026191488867, "1": 0.10292285005570073}, "score": 3.0079441973744037}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.302769799452591, "4": 0.24503289797569597, "2": 0.23237600686923676, "5": 0.11896413712366265, "1": 0.10084423301548152}, "score": 3.0488973313483747}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2841678483740971, "4": 0.2472767065387511, "2": 0.2246448428738248, "5": 0.13909275030426463, "1": 0.10480944364903999}, "score": 3.0911992438023317}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2884702551737798, "4": 0.25525674428860984, "2": 0.2191010806872801, "5": 0.1406047241839084, "1": 0.09655890908990512}, "score": 3.1242483233825746}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2737267316507718, "2": 0.24910509581957965, "4": 0.19119450850221945, "1": 0.166067989363402, "5": 0.11989387529858088}, "score": 2.8497394115734025}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2718389727344877, "2": 0.2671221592323076, "4": 0.1794221984199948, "1": 0.1782994747491291, "5": 0.1033079960245346}, "score": 2.762314895311358}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28165366531595376, "2": 0.2598712143775021, "4": 0.19234533552747773, "1": 0.15933918657614324, "5": 0.10678141333983356}, "score": 2.8273569889749366}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28004051215810255, "2": 0.2680184386245705, "4": 0.18634699104144045, "1": 0.16620390517428207, "5": 0.09938297079165773}, "score": 2.7846851372150723}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27092921269246806, "2": 0.2514864167115731, "4": 0.19622274714767554, "1": 0.16192770642300525, "5": 0.11942305574172896}, "score": 2.8597255055124906}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "human", "scores": {"3": 0.25939102675689263, "2": 0.242564263400131, "4": 0.2028181326039453, "1": 0.15965992412391558, "5": 0.13555306387635438}, "score": 2.9120389533850273}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2683725102384882, "4": 0.23266984605230165, "2": 0.2222922325317707, "5": 0.1526928487313378, "1": 0.12394842838605488}, "score": 3.0678680921437076}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2637006818296392, "4": 0.2347309064213491, "2": 0.21654718731993766, "5": 0.16006279051728545, "1": 0.12494386781704168}, "score": 3.088422852477546}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26618484646955015, "4": 0.2324563531418645, "2": 0.22286479318251343, "5": 0.15442105254597574, "1": 0.12406092542122632}, "score": 3.0703126600166333}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2659023879876709, "4": 0.24728778478335492, "2": 0.209197813200184, "5": 0.16411763856129477, "1": 0.11348100646329107}, "score": 3.139365098951772}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3108563097802704, "3": 0.30475835350116226, "4": 0.16874391654213508, "1": 0.14859337952687693, "5": 0.06703851325755503}, "score": 2.694774966224676}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31092856118195106, "2": 0.2797141752123383, "4": 0.20396948085125188, "1": 0.11965364514823461, "5": 0.08572523837010844}, "score": 2.856397214127562}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31711125643732374, "2": 0.30085916924017747, "4": 0.1872104114060266, "1": 0.12285757762352804, "5": 0.07195034864527301}, "score": 2.784534363097892}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3055343402430757, "2": 0.24222319124269198, "4": 0.24119971396811016, "5": 0.11451636963064846, "1": 0.09651618157303893}, "score": 3.034977255725554}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29313981484784596, "2": 0.26750618270427434, "4": 0.2017821961858558, "1": 0.13786831341883907, "5": 0.09968786744909862}, "score": 2.85791290137519}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29305112415945095, "2": 0.24127900934557278, "4": 0.23475299563892474, "5": 0.1185692382509235, "1": 0.11233942615502336}, "score": 3.0059336591794303}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3035120396232595, "4": 0.24757146281596754, "2": 0.23680274120610348, "5": 0.1183414723639123, "1": 0.09376412113823385}, "score": 3.059923913211287}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30765418585150384, "4": 0.2500762519063151, "2": 0.2340424897452973, "5": 0.11780253364192222, "1": 0.09041764884976806}, "score": 3.070804019585389}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3022472161353372, "4": 0.2528136557929623, "2": 0.22861820359900317, "5": 0.1249815190762923, "1": 0.09133019711579266}, "score": 3.0914989386628617}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29837267099025755, "4": 0.27776404074581107, "2": 0.20683682119439628, "5": 0.1466261982256419, "1": 0.0703952281553267}, "score": 3.223390285732904}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3537623567120428, "3": 0.2746892280926925, "1": 0.22926207442155938, "4": 0.101043859896693, "5": 0.041222353874293766}, "score": 2.371189406017585}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2981921504807903, "2": 0.28760556601555637, "4": 0.17982764762409478, "1": 0.15453549004411762, "5": 0.07982558594808711}, "score": 2.7427987857969858}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32254448960412346, "2": 0.2719253768889157, "4": 0.20776079190526855, "1": 0.10729835074144557, "5": 0.0904620457699209}, "score": 2.902161929902929}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.3007470899953786, "3": 0.29679912969134503, "4": 0.1673437163471777, "1": 0.1565525723270152, "5": 0.07854379591675405}, "score": 2.7105751096483433}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3052242581293242, "2": 0.27793052683327646, "4": 0.19608302745195935, "1": 0.1290834092799568, "5": 0.09166802059183563}, "score": 2.843320037724272}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "human", "scores": {"2": 0.26332899421223366, "3": 0.26190443334151503, "4": 0.18900717531755226, "1": 0.17203063630112847, "5": 0.11371983990502142}, "score": 2.809054884906522}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2623780700262075, "2": 0.24274984750709597, "4": 0.21130132155042733, "1": 0.14494508970108985, "5": 0.1386178794757018}, "score": 2.955896709951209}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2755978337491434, "2": 0.24778706760271738, "4": 0.21475208697593234, "1": 0.13415256257259928, "5": 0.12769590293172892}, "score": 2.954051031710068}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26589334746016924, "2": 0.22974051559799186, "4": 0.2290575034915433, "5": 0.15150581074738811, "1": 0.12379350298946439}, "score": 3.0547421135902106}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2743012565817606, "2": 0.23929772284826142, "4": 0.22312915606496836, "5": 0.13448525691004667, "1": 0.12877690376321077}, "score": 2.9952480933986765}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30376351241498445, "2": 0.28455446574367876, "4": 0.19241730537861984, "1": 0.13997762368060027, "5": 0.07927605900673712}, "score": 2.786457354105626}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3140548898222401, "2": 0.26111357840869653, "4": 0.2208248998229693, "1": 0.10853903512133889, "5": 0.09545980596861993}, "score": 2.933552345424718}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29979322259203683, "2": 0.2799896614184815, "4": 0.19691543625310837, "1": 0.1373873459319741, "5": 0.08590596596147214}, "score": 2.8139614581523267}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.31433185126043806, "2": 0.2780479216809356, "4": 0.2043567577561331, "1": 0.11866035813441406, "5": 0.08459417230722883}, "score": 2.858175196668644}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3014542245639861, "2": 0.26773617633179664, "4": 0.2104449458441527, "1": 0.12385774372142026, "5": 0.0964976811943493}, "score": 2.887987610769321}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30637216210253004, "2": 0.27534354677302014, "4": 0.19916254074178252, "1": 0.12178206306830712, "5": 0.09731543201023159}, "score": 2.8748826970943773}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3143509317828976, "2": 0.2899512423397379, "4": 0.1904617484720102, "1": 0.12069850947025657, "5": 0.08451916209267485}, "score": 2.828148648308209}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30819551760142055, "2": 0.292208029668596, "4": 0.18373067802934726, "1": 0.135541962535029, "5": 0.080306252243153}, "score": 2.7810473829860234}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30693042062427445, "2": 0.26343637533132774, "4": 0.21304328882537063, "1": 0.11214265643592358, "5": 0.10442841147416368}, "score": 2.934177182987556}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3143300910069997, "2": 0.26657978481838096, "4": 0.21200434695831194, "1": 0.1048149358077805, "5": 0.10225633806648335}, "score": 2.9403065009021017}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29247467419720824, "2": 0.26938788131516384, "4": 0.19392144977096157, "1": 0.1511844143871231, "5": 0.09302180973902338}, "score": 2.808206485223701}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30434961166249247, "2": 0.2916491909005856, "4": 0.17902339202062853, "1": 0.1486249441127288, "5": 0.07634508683078028}, "score": 2.742812487058826}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2977681248164681, "2": 0.28061327586869256, "4": 0.19113327870762126, "1": 0.14385454414720397, "5": 0.08661961395246802}, "score": 2.7960478658322203}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29835193481021427, "2": 0.2702989257487731, "4": 0.19827423129184385, "1": 0.1380154284102251, "5": 0.09505030511552348}, "score": 2.8420436097632704}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2809207718825053, "2": 0.2692771048623181, "4": 0.19679137923965237, "1": 0.1521657943912833, "5": 0.1008341692632162}, "score": 2.824849135931651}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2724724148258012, "2": 0.23286073685712483, "4": 0.22902852954999206, "5": 0.14085623763244126, "1": 0.12476909374378352}, "score": 3.02834244856464}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2836760105386946, "4": 0.2723437564893368, "2": 0.20580379819386307, "5": 0.1650786915972427, "1": 0.07308687331248173}, "score": 3.250526318053099}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27922864964964017, "4": 0.26952549284226396, "2": 0.20119604459909865, "5": 0.1660688529191919, "1": 0.08396974698085748}, "score": 3.232530267483804}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28923880997519674, "4": 0.2752891167344097, "2": 0.2015637642023612, "5": 0.15964573098755522, "1": 0.07425405425715795}, "score": 3.2445107901645085}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3043070056993467, "3": 0.27269214338909153, "5": 0.19532340636922757, "2": 0.17052274319182084, "1": 0.05714325034017954}, "score": 3.4101492711891646}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "human", "scores": {"3": 0.282449925210319, "2": 0.26179259784220577, "4": 0.19032436084972845, "1": 0.17069092739643366, "5": 0.09472749339160406}, "score": 2.7766016120893644}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28851733736122614, "2": 0.2609352204435083, "4": 0.20794366028199, "1": 0.13703454933777887, "5": 0.10555715702743534}, "score": 2.884052255085228}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30124376243548046, "2": 0.24978413353032097, "4": 0.22664723524843275, "5": 0.11190038758470164, "1": 0.11041690851805694}, "score": 2.979829907109681}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.32881088865536917, "4": 0.2548099514807237, "2": 0.2386897470138429, "5": 0.10262746417996337, "1": 0.07505350648565753}, "score": 3.0712687215191843}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31204027904564696, "2": 0.2484013485480874, "4": 0.23074637854542812, "5": 0.10920515607303227, "1": 0.09959662505058323}, "score": 3.001562107995637}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30029750871938743, "2": 0.2543958654017125, "4": 0.2181144835803215, "1": 0.12230822327459409, "5": 0.10487608170675462}, "score": 2.928853777447414}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2974377855701211, "2": 0.2653871170227927, "4": 0.20959520577661886, "1": 0.1295138828647028, "5": 0.09805801359507205}, "score": 2.8812954011510348}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.315813509316259, "2": 0.262493620527016, "4": 0.21672140461136385, "1": 0.11109380994004046, "5": 0.09386941168412549}, "score": 2.919778326231361}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29472495897544576, "2": 0.27547414564544526, "4": 0.1971430444062255, "1": 0.14035695818853414, "5": 0.09229165991560966}, "score": 2.8255366914181037}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31714680660171984, "2": 0.26754363619153587, "4": 0.21980479982777976, "1": 0.10516560298156684, "5": 0.09033322012501023}, "score": 2.9225959385863463}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2902170464226368, "2": 0.2589231964660566, "4": 0.2095324623651667, "1": 0.13572577352485143, "5": 0.10558323286545453}, "score": 2.8903221787532947}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28926333846627594, "4": 0.23965042019704583, "2": 0.23654374969944952, "5": 0.1290021252435462, "1": 0.10552932527490505}, "score": 3.0500528230740436}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2967699854478151, "2": 0.24579362940133723, "4": 0.2283274719521645, "5": 0.12021597045796893, "1": 0.10888130881503269}, "score": 3.0052032263706487}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28111211597178265, "2": 0.23397118786206544, "4": 0.2327365155131399, "5": 0.13640833887421655, "1": 0.11576118037125314}, "score": 3.0400600717537527}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28422511396485894, "2": 0.24965792452493688, "4": 0.21819205888275398, "1": 0.1260192885520943, "5": 0.1218925938851205}, "score": 2.9602802278648808}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28516894068541615, "4": 0.2630333365221542, "2": 0.21324421942750532, "5": 0.15390696230681072, "1": 0.0846366830972123}, "score": 3.1883315320787258}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2848050978073651, "4": 0.26096979665084025, "2": 0.21649684595129667, "5": 0.15156959296515785, "1": 0.08614919157289945}, "score": 3.1753154146068074}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3031262177435953, "4": 0.2807472445543482, "2": 0.19993045458103706, "5": 0.15358289886210447, "1": 0.06260508338122758}, "score": 3.26277454963955}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2877610300660342, "4": 0.27410418709405837, "2": 0.19356836914568396, "5": 0.17707050365225183, "1": 0.06748738415360336}, "score": 3.2997046121937377}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2931408115249108, "4": 0.27017299579333265, "2": 0.21328706449483117, "5": 0.1458625265250851, "1": 0.0775283424845642}, "score": 3.1935558979920176}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2890987944439024, "2": 0.2562265153869054, "4": 0.2160802527052274, "1": 0.13109679965371976, "5": 0.10748245005976606}, "score": 2.9126237110811406}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29595140808769677, "2": 0.24100222817374742, "4": 0.23095673046734, "5": 0.11987065410398089, "1": 0.11220885134637391}, "score": 3.0052781612650783}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28778442598880993, "2": 0.23678912543994116, "4": 0.224332870759715, "5": 0.12797056531289963, "1": 0.12311199616144007}, "score": 2.997260853447331}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29893049225223817, "4": 0.24374784747864836, "2": 0.23109120951647502, "5": 0.12526688972557104, "1": 0.10095259790326853}, "score": 3.0612858934916156}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3025463470072755, "2": 0.23822125364304808, "4": 0.2317408169806999, "5": 0.11893325804194355, "1": 0.10854782713925562}, "score": 3.014290575153878}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28664329809464, "2": 0.23840513609508593, "4": 0.22366378824696073, "5": 0.12738340542739748, "1": 0.12389214379308061}, "score": 2.992241080541781}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2866555666903446, "2": 0.23096287399807902, "4": 0.2226488304703635, "5": 0.14001500269599948, "1": 0.11970019947042591}, "score": 3.0323161293177203}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29413453919745375, "2": 0.2352885372276642, "4": 0.23030017782747972, "5": 0.12846844101812355, "1": 0.1117953512582473}, "score": 3.028358187456528}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28621963738794204, "2": 0.23937545937237067, "4": 0.22505307853473708, "5": 0.12861621326112882, "1": 0.12072170995327179}, "score": 3.001466646166648}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28990873860321087, "2": 0.2519981834571672, "4": 0.21187250006929617, "1": 0.13170021996985687, "5": 0.11450589186219248}, "score": 2.925484582453918}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3198940281710712, "2": 0.29251781739338484, "4": 0.17305143786125415, "1": 0.14786100528184903, "5": 0.06666359347764987}, "score": 2.718135381276225}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31488943555780213, "2": 0.2490405610500932, "4": 0.23128323361166642, "5": 0.10471083293814536, "1": 0.10006968356712911}, "score": 2.9915249183065877}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3275678401048982, "2": 0.2724883821771488, "4": 0.2132309347264577, "1": 0.10381267561026875, "5": 0.08289338623994642}, "score": 2.898903288257579}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3057855009857127, "4": 0.24006321367710884, "2": 0.23431706550310544, "5": 0.12210400468504708, "1": 0.09772615973907874}, "score": 3.054502059094133}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31518862810384435, "2": 0.25106414869836396, "4": 0.22560170539766328, "1": 0.11172249561863794, "5": 0.09641686929387669}, "score": 2.943925959032505}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2845170777433255, "4": 0.2575329515193489, "2": 0.21911468728687133, "5": 0.144394029547813, "1": 0.09443096882911699}, "score": 3.138345808566682}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.31429856527991334, "3": 0.269224816325935, "5": 0.19631271627431643, "2": 0.16789914621365276, "1": 0.05225605028043815}, "score": 3.4345165337923396}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.30219744011800725, "3": 0.2927785961932022, "2": 0.18121188445935346, "5": 0.16998299097937788, "1": 0.05382133656543522}, "score": 3.353311603246662}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3411231238018432, "3": 0.2659757339802254, "5": 0.21260553045152564, "2": 0.1446211810057758, "1": 0.03566703165225163}, "score": 3.550383012738176}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.302006904284316, "3": 0.2579622300325553, "5": 0.21538346098655975, "2": 0.1649431681281644, "1": 0.05969574106936063}, "score": 3.4484429857375067}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27384443207060105, "2": 0.252862150102599, "4": 0.20096542512956211, "1": 0.15743238727963027, "5": 0.1148730584343425}, "score": 2.8629815279831927}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2723404883838676, "2": 0.23980252663932664, "4": 0.20869362742171169, "1": 0.1453840670515781, "5": 0.13374977171650015}, "score": 2.9456209049073028}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28187053759473696, "2": 0.2422837061538622, "4": 0.21848174824390443, "1": 0.13036340570115232, "5": 0.126979477508829}, "score": 2.9694295399106165}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2696378814460066, "2": 0.23318750652942738, "4": 0.2222355107920304, "5": 0.1419120470857706, "1": 0.1330077342760058}, "score": 3.0068567623538955}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.272205903745793, "4": 0.2348012188565839, "2": 0.22265838231007623, "5": 0.14818956206660272, "1": 0.12211915873231766}, "score": 3.064285300122958}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3081144112152565, "3": 0.28582855670098056, "1": 0.17065715100418619, "4": 0.16818930810859892, "5": 0.06719597023447463}, "score": 2.653147470357823}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.300561916892561, "3": 0.28614522995560654, "4": 0.18511998436416766, "1": 0.14980353650501746, "5": 0.07835992053561855}, "score": 2.7416684041811794}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27439812945735925, "2": 0.26476233618143635, "4": 0.20627104966359572, "1": 0.1486485624927789, "5": 0.10591326230346655}, "score": 2.8560371543251817}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27908625143720567, "2": 0.24669754669093052, "4": 0.21433291397185003, "1": 0.13145837728706136, "5": 0.12841634478427702}, "score": 2.961550972927572}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2754421374094358, "2": 0.24138722311307687, "4": 0.22258723206150524, "1": 0.13178403430831573, "5": 0.12879117303465074}, "score": 2.97521408315477}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2894137945174614, "2": 0.24207499600202062, "4": 0.23568071323187828, "5": 0.11951991126810167, "1": 0.1132980411673616}, "score": 3.006049533315553}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.28659864254755435, "3": 0.2748218251072561, "2": 0.1923222362398209, "5": 0.1756060579148565, "1": 0.07063800251881143}, "score": 3.3042165436101203}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2901304585755336, "4": 0.2582364347374901, "2": 0.21579590548376307, "5": 0.14772697092322543, "1": 0.08809713204280624}, "score": 3.161702325029972}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2989295655691485, "4": 0.27714731252171915, "2": 0.20719995205326439, "5": 0.14376677650393146, "1": 0.07294283695447025}, "score": 3.211598108075434}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2827991643158434, "4": 0.2673503255221886, "2": 0.20905468720013373, "5": 0.148511675638766, "1": 0.09226490844121366}, "score": 3.1707924585730916}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28320906740559604, "4": 0.2687970083621967, "2": 0.2050844773691009, "5": 0.16651353193187246, "1": 0.07637632599533818}, "score": 3.243991722404374}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2800358915277722, "4": 0.24012571026520704, "2": 0.22676310425817137, "5": 0.15256508303145933, "1": 0.10049316135672455}, "score": 3.1175084528240005}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2771741139626687, "4": 0.2703776752951583, "2": 0.19868413035038895, "5": 0.1790062065999079, "1": 0.07474396543027137}, "score": 3.280221924711901}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.29037522878410293, "3": 0.2778511612087635, "5": 0.19226337541241706, "2": 0.18075810102477907, "1": 0.05873563303199011}, "score": 3.376678827923471}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2620276621681066, "4": 0.252203040403149, "2": 0.20552592444200732, "5": 0.17995043988059228, "1": 0.10027754374088052}, "score": 3.2060260788511465}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2837213172152194, "3": 0.2750918051823555, "4": 0.18026377213388664, "1": 0.16027243387495851, "5": 0.1006385594523699}, "score": 2.7772720083606033}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2883349943452469, "2": 0.280630421863653, "4": 0.19516605864781508, "1": 0.13599706151321325, "5": 0.09986319296566556}, "score": 2.842266595129009}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2843264867141858, "3": 0.2701882069611862, "4": 0.17918979994698642, "1": 0.16758553522479386, "5": 0.09870144424253102}, "score": 2.7570930600225823}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.28675232927186967, "3": 0.2809208280666653, "4": 0.18887202682666776, "1": 0.15076066494099, "5": 0.0926854014938531}, "score": 2.7859672980028116}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2751877464212054, "2": 0.2552391832287102, "4": 0.2064046946987353, "1": 0.1427804990038109, "5": 0.12037893739387912}, "score": 2.906361551192316}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2703429610303539, "3": 0.25539038063815245, "1": 0.19878103235513667, "4": 0.17388561169571784, "5": 0.10158473512076575}, "score": 2.7091456121859308}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27432701467907733, "2": 0.2623284590240337, "4": 0.19097711020036978, "1": 0.16424269458812843, "5": 0.10811270837077434}, "score": 2.8163864729670594}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2720817245255575, "2": 0.2547828156658988, "4": 0.20377629091904326, "1": 0.15025120284122945, "5": 0.11909629635973418}, "score": 2.8866823399083548}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26981579326147476, "2": 0.23651470391043436, "4": 0.21462984194407161, "1": 0.14555247565051183, "5": 0.13347276893008272}, "score": 2.9539550607949643}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.26959668392529235, "2": 0.25084639482271964, "4": 0.20180154802637595, "1": 0.1549268204001996, "5": 0.12281555523456249}, "score": 2.8867311506502222}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26887537411138734, "2": 0.24248556406631522, "4": 0.22639590958961545, "5": 0.1323919815002707, "1": 0.12984169517299593}, "score": 2.989010814049166}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.25675634955055066, "4": 0.25356086148834195, "2": 0.20843786328023955, "5": 0.1755715020430682, "1": 0.10566321076519183}, "score": 3.1849414695475233}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2695409910036703, "4": 0.24783774523965388, "2": 0.2197689965421446, "5": 0.15232508878228332, "1": 0.11051670422414538}, "score": 3.1116866876433944}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2582730036056637, "3": 0.2557118639075744, "2": 0.20154147248279525, "5": 0.17991954504246258, "1": 0.10454437045895654}, "score": 3.207483902117293}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27549612935940626, "4": 0.244964494340173, "2": 0.23368703875853797, "5": 0.1404377709093373, "1": 0.10540917471830298}, "score": 3.0813350865155154}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.25678616069323684, "2": 0.25640637262828564, "1": 0.1987630633620225, "4": 0.17460566334352692, "5": 0.1134171459799721}, "score": 2.747502003511183}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2666282267661001, "2": 0.24578596075973136, "4": 0.18497881018583368, "1": 0.18388128864366635, "5": 0.11869394376790908}, "score": 2.808812085658111}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2682946398355589, "2": 0.24029003646496747, "4": 0.19297722542874868, "1": 0.17217260291909464, "5": 0.12624197212211255}, "score": 2.8608226534691505}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2741224156285922, "2": 0.2401523416831603, "4": 0.1992741029991145, "1": 0.16214164077147827, "5": 0.12428749362106169}, "score": 2.883410901437427}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2698119888856107, "2": 0.24262952196386897, "4": 0.19047407174578995, "1": 0.17347459791950806, "5": 0.12358948628446279}, "score": 2.848071237313798}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2705445768507614, "4": 0.26395802095858617, "2": 0.20021816138633988, "5": 0.1784691003553811, "1": 0.08680057785693777}, "score": 3.247079267287356}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2756281511782838, "4": 0.25847176947282546, "2": 0.20612196959362827, "5": 0.17147501639245383, "1": 0.08829489387980864}, "score": 3.2187118382284874}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2682304446095114, "4": 0.26493713700124133, "2": 0.19412703784046276, "5": 0.18710150535691744, "1": 0.08559417904135508}, "score": 3.273827406863655}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27352706611151784, "4": 0.2676452953278553, "2": 0.19740836045843577, "5": 0.1790942097754606, "1": 0.08231402275242035}, "score": 3.263800222740463}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.269049688721897, "4": 0.2438737025979285, "2": 0.21465368864417128, "5": 0.16165651055425362, "1": 0.1107512592409596}, "score": 3.1310325017542984}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2649676595174871, "2": 0.24353785171957884, "4": 0.1990646166857448, "1": 0.15691210047583404, "5": 0.13548254041370966}, "score": 2.9126645679109213}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.25853543891021596, "2": 0.22253165896824895, "4": 0.22242217807885287, "5": 0.16214754283461924, "1": 0.13433532224756897}, "score": 3.0555165069168777}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26458021588358427, "2": 0.2334475855710794, "4": 0.21478445255412465, "5": 0.1469540979220614, "1": 0.14021897095770486}, "score": 2.9948070446941752}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27274401436753776, "2": 0.22988472301187382, "4": 0.22166700515068216, "5": 0.15154626819968722, "1": 0.12414557624533766}, "score": 3.0465842442988915}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2716413361288815, "2": 0.23656626973635766, "4": 0.22113409428480305, "5": 0.140233344138841, "1": 0.13041051450932586}, "score": 3.004213544656125}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2555805128988624, "2": 0.24808831185868147, "4": 0.19950507587368926, "1": 0.16715056264724126, "5": 0.12966453030038952}, "score": 2.876443339404664}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.26644197204621445, "2": 0.26207213203553803, "4": 0.18809713011908957, "1": 0.16862526380629872, "5": 0.11475360665393847}, "score": 2.8182798855967097}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.27553638228431027, "3": 0.2668171998005564, "1": 0.18095778626006936, "4": 0.1727676587742525, "5": 0.10391194719995224}, "score": 2.743137280008773}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2610496134180178, "2": 0.25730063288015737, "4": 0.19078082937303376, "1": 0.16762043016566497, "5": 0.12324009923950223}, "score": 2.844718231061961}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2627376955020057, "2": 0.2594648080561057, "4": 0.19202183297649336, "1": 0.168388983156467, "5": 0.11737656596357533}, "score": 2.830530476461316}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27463569637897217, "2": 0.2688982563793509, "4": 0.1810818753492267, "1": 0.16964409420490706, "5": 0.10572953523707371}, "score": 2.7843522275782497}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2870972702245822, "2": 0.24899899964884936, "4": 0.20479794910554647, "1": 0.13925389907892022, "5": 0.11984143320068316}, "score": 2.916973150174138}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2907230741867144, "2": 0.2665505426199503, "4": 0.1913556003435325, "1": 0.14916667113202114, "5": 0.1021934595332141}, "score": 2.8308568327817327}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2967316749156918, "2": 0.27158310246928685, "4": 0.18952796363313346, "1": 0.14589823804248983, "5": 0.09624964443527771}, "score": 2.8186459734826457}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.279805992471031, "2": 0.2713747695440193, "4": 0.18104024941116886, "1": 0.1682906895288192, "5": 0.09947281382903635}, "score": 2.7720261982440384}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2878290648149323, "4": 0.2695340908426231, "2": 0.20572295376448085, "5": 0.15503273357567104, "1": 0.08187230513091381}, "score": 3.2101338540455053}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29913688529603666, "4": 0.25103708544187, "2": 0.22652551305116672, "5": 0.13393140675227339, "1": 0.08936282598509025}, "score": 3.1136494480383714}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2998856630915328, "4": 0.2847585075045545, "2": 0.1965183240220323, "5": 0.15502913685797418, "1": 0.06379979511501184}, "score": 3.2707011878004177}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2962440414452646, "4": 0.288803688566604, "2": 0.19672924233402228, "5": 0.1542582396683956, "1": 0.06395579099590457}, "score": 3.2726817968929116}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29482556577151725, "4": 0.27093598600745145, "2": 0.1984899916550143, "5": 0.1618922319488985, "1": 0.0738481663276158}, "score": 3.248536128371077}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "human", "scores": {"3": 0.32654200048294385, "2": 0.28591829236820515, "4": 0.1921997275463037, "1": 0.12024432072616818, "5": 0.07507665655661518}, "score": 2.8159426093216}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3171116052598977, "2": 0.2964827918007839, "4": 0.1811906839091281, "1": 0.1333699544338584, "5": 0.07182758388741424}, "score": 2.7616190077848186}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.3424564098124615, "3": 0.32313473710480206, "4": 0.14385257335344914, "1": 0.14240923921232368, "5": 0.04812716983067236}, "score": 2.6128243313314337}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3194766151059101, "2": 0.28219321022648086, "4": 0.19991382105918004, "1": 0.11631591319150167, "5": 0.08208938207986255}, "score": 2.849265881740735}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.32085929027746224, "2": 0.3143293994815602, "4": 0.16956604195395447, "1": 0.13370585550290542, "5": 0.0615263648060637}, "score": 2.7108738885675545}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.32425595191810147, "2": 0.30814448464935085, "4": 0.19604571640209423, "1": 0.10562225307853874, "5": 0.06592108066052811}, "score": 2.8084968735885525}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.35101623606171206, "2": 0.3033999429813471, "4": 0.19356434296547817, "1": 0.09035552615062464, "5": 0.06165331990315701}, "score": 2.8327582093848998}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3422735526803247, "2": 0.26449000941104567, "4": 0.23603421633391908, "5": 0.08351616274904117, "1": 0.07367844441316668}, "score": 2.991219576736858}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3562075900355507, "2": 0.3134115800494065, "4": 0.2043118450768626, "1": 0.07203030109185406, "5": 0.054028937301197635}, "score": 2.8548961231991705}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3417950125935485, "2": 0.3195678067442892, "4": 0.1877510304382671, "1": 0.09530071173374247, "5": 0.05557611257439041}, "score": 2.788732055108216}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "human", "scores": {"3": 0.25497068531017747, "2": 0.23955386053578503, "4": 0.2052020244486555, "1": 0.1607987975802489, "5": 0.13946533544967493}, "score": 2.9229805236266464}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2638317472589494, "2": 0.24491090197203025, "4": 0.2094530227181468, "1": 0.1511404261231393, "5": 0.13065651790115504}, "score": 2.923573739968613}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26265158419983364, "2": 0.2552591181873704, "4": 0.19489293938202956, "1": 0.1678054846240793, "5": 0.11937859087564269}, "score": 2.8427781025835057}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26197720049998763, "2": 0.22744655301366457, "4": 0.22556595036101926, "5": 0.14942962989654318, "1": 0.13556866693194516}, "score": 3.025841633357981}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.26099579053706073, "2": 0.23394484418948877, "4": 0.21763716141930206, "1": 0.14909149516279846, "5": 0.13831750163237766}, "score": 2.962143830200305}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29922041597475146, "2": 0.24530059551987304, "4": 0.22592933626399425, "5": 0.1205845997228692, "1": 0.10895137469526749}, "score": 3.0038952440777846}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29985417674997006, "4": 0.23476060175920194, "2": 0.23375037652792163, "5": 0.13065150078719687, "1": 0.10097159897013826}, "score": 3.060370737932125}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3108580505804794, "4": 0.2462126218235928, "2": 0.2320700066575012, "5": 0.12277093217029211, "1": 0.08807644045681129}, "score": 3.0835325966665237}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30061776648498606, "4": 0.265146520034881, "2": 0.20817622966426508, "5": 0.1473754303539916, "1": 0.07866981832293615}, "score": 3.194384281519982}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2801517103128025, "4": 0.25302165526114445, "2": 0.21013552484768988, "5": 0.1574746163085583, "1": 0.09920535344182506}, "score": 3.15942643212995}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "human", "scores": {"2": 0.29357753524567287, "3": 0.2622127452362509, "1": 0.20076116726126267, "4": 0.1664997118822621, "5": 0.07694005244678348}, "score": 2.625276653965933}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2820209556469916, "3": 0.2785413379303253, "4": 0.1896344703580403, "1": 0.1547412054077596, "5": 0.09504987739011288}, "score": 2.7882282849576083}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2673083548158683, "2": 0.2650319484696206, "4": 0.19354458105492406, "1": 0.16851918131014373, "5": 0.10558541846099567}, "score": 2.802643031503142}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2812671639353246, "2": 0.2653548479113645, "4": 0.20381038554444994, "1": 0.13959127368882912, "5": 0.1099665445394822}, "score": 2.8792048974291395}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2861144423852643, "3": 0.27777959596763496, "4": 0.18085154095418673, "1": 0.1647730840145831, "5": 0.09046903875633436}, "score": 2.746125885928373}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26004494435547676, "2": 0.23777786059637696, "4": 0.21903408982023154, "1": 0.14773258465478073, "5": 0.13539390964241424}, "score": 2.9565781579219106}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2578199773033789, "4": 0.22790276734508214, "2": 0.22545650976321802, "5": 0.15060809701828193, "1": 0.13819468875109459}, "score": 3.027273563944509}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.25842628244437416, "2": 0.23494418586609697, "4": 0.2136666903258875, "1": 0.15260461776597642, "5": 0.1403378849739706}, "score": 2.954188107124929}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2667366064987279, "2": 0.2322775700104474, "4": 0.23159984558846305, "5": 0.14154093647908295, "1": 0.1278325595404306}, "score": 3.02673936321292}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2608517867017769, "2": 0.2359320356419628, "4": 0.20616189928620446, "5": 0.17043438415424714, "1": 0.12661284666160263}, "score": 3.0578733464950774}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28522538120338287, "4": 0.250274816217276, "2": 0.22234865746040783, "5": 0.14298713754578463, "1": 0.09915354209948796}, "score": 3.1155945594012784}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2975118865514007, "4": 0.25648692251962635, "2": 0.227564013988927, "5": 0.12884579207043478, "1": 0.08957802014290252}, "score": 3.1074598885578064}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2943870443673882, "4": 0.25104730285917054, "2": 0.23168798609737784, "5": 0.13428061861196916, "1": 0.0885881657239004}, "score": 3.110745206214527}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28663120200268977, "4": 0.2861668633527233, "2": 0.19395509806140163, "5": 0.16999577418094186, "1": 0.06324520275637206}, "score": 3.305714699520339}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2901333018679597, "4": 0.2640565220704456, "2": 0.20858849319364725, "5": 0.1555805927925913, "1": 0.08163225608184167}, "score": 3.2033664988366293}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "human", "scores": {"2": 0.29104447163470654, "3": 0.2783136677739288, "1": 0.17357725585486042, "4": 0.17269027619811295, "5": 0.0843585847354968}, "score": 2.703203789623643}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3010619564597536, "2": 0.2966987098578516, "4": 0.17817641927539973, "1": 0.14368690749988636, "5": 0.08036311312918444}, "score": 2.7548269594694066}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.3039665550229607, "3": 0.3010045193181386, "4": 0.16889237521005104, "1": 0.14927031829428167, "5": 0.07685551871960482}, "score": 2.720093222274677}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.3030275662161269, "3": 0.2970344659329708, "4": 0.17213445369737768, "1": 0.14756867770593957, "5": 0.08022388423735327}, "score": 2.734414391794663}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.29079247806754643, "3": 0.27377931960683344, "4": 0.17392849717512426, "1": 0.17350337974268912, "5": 0.08798711461980746}, "score": 2.7121008370836597}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27551921690240117, "4": 0.23992557689518465, "2": 0.22840648692626217, "5": 0.14298193290870295, "1": 0.11314772648886916}, "score": 3.0711888596596113}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27143363711549073, "4": 0.2562305637978309, "2": 0.2138241993370563, "5": 0.1612958697810418, "1": 0.09720258239683408}, "score": 3.1705951821415863}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26999849339981924, "4": 0.23781607456898524, "2": 0.23042362876850264, "5": 0.14525237968657287, "1": 0.11649492140694742}, "score": 3.064908303670934}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2712856104443895, "4": 0.26803913044672634, "2": 0.20798404686222677, "5": 0.16600257146376532, "1": 0.08667667175247458}, "score": 3.2187095007477478}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2749153353973561, "4": 0.2662193462611908, "2": 0.21072139939346232, "5": 0.15985740178204721, "1": 0.08827354675543986}, "score": 3.1986682337294883}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2971948781405068, "4": 0.2491087826022799, "2": 0.22757011278622546, "5": 0.13068776160962176, "1": 0.09543138227090114}, "score": 3.092052080460683}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30776840828366375, "4": 0.25241604010438135, "2": 0.23670945930380974, "5": 0.11499280704613177, "1": 0.08810366028215888}, "score": 3.0694855431254697}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31514154244019227, "4": 0.2756430906289331, "2": 0.21191445497770875, "5": 0.13044619970760818, "1": 0.06684624149343646}, "score": 3.190930169401706}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3049341888254942, "4": 0.26625917565455576, "2": 0.22484009912034528, "5": 0.12664647949991917, "1": 0.07731104876749605}, "score": 3.1400911999591044}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3214589905661184, "4": 0.28686690971333306, "2": 0.21289410425954305, "5": 0.12254826825916793, "1": 0.05622034370223151}, "score": 3.2066310067516466}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2527347902360215, "2": 0.25223154095696554, "1": 0.1982652496726016, "4": 0.17850008528061648, "5": 0.11825846128059922}, "score": 2.7662526598519213}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.25812361006949525, "3": 0.25014858441714327, "1": 0.2056739975275082, "4": 0.1707815200346117, "5": 0.11525850543022916}, "score": 2.731823229618585}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2593101871733561, "3": 0.25002104116538426, "1": 0.2052451419233243, "4": 0.16824081556013018, "5": 0.11717267236205842}, "score": 2.732782979198453}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.26446239809539884, "3": 0.2510402234250504, "1": 0.20206767761409253, "4": 0.17020998470871818, "5": 0.11221111798806409}, "score": 2.7260321117391477}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2549224494197759, "3": 0.25227518078828765, "1": 0.1950539874536561, "4": 0.17836997046405753, "5": 0.11936880223253075}, "score": 2.772074960324067}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28215875653895267, "2": 0.2524541073134245, "4": 0.21870930616717538, "1": 0.13192944590656913, "5": 0.11473975672947508}, "score": 2.9318752327637334}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27885738297120816, "2": 0.2693355982016409, "4": 0.20326911260871514, "1": 0.15075082059099087, "5": 0.09778010969275906}, "score": 2.827990892686312}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2893316416033559, "2": 0.2856326598036362, "4": 0.1964793386540227, "1": 0.14590859718513605, "5": 0.0826410540113926}, "score": 2.7843101454952155}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2941028626133969, "2": 0.2746636557159696, "4": 0.21174264085191452, "1": 0.13016900947564417, "5": 0.08931407399414074}, "score": 2.855367992211986}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.29803677322678945, "3": 0.2853863222300685, "4": 0.17932885139893853, "1": 0.16026900408157252, "5": 0.07697142730149556}, "score": 2.7146947500835297}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "human", "scores": {"2": 0.289122761727392, "3": 0.2856023557860876, "4": 0.17041706890044686, "1": 0.1689877080730196, "5": 0.08585763168636984}, "score": 2.7150305997408464}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3012711768651997, "2": 0.26819286815651366, "4": 0.19888629489420112, "1": 0.13201236322317958, "5": 0.09962687713915826}, "score": 2.865921057504371}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.282811890564576, "2": 0.27288271267856545, "4": 0.19665617099433694, "1": 0.14649716532933948, "5": 0.10114114120246484}, "score": 2.8330595872011384}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2880365491866788, "2": 0.2597314152933624, "4": 0.21129631376844907, "1": 0.1264883588437134, "5": 0.1144341191710849}, "score": 2.92745545836902}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2890945158134066, "2": 0.27314281191753376, "4": 0.19437153938776047, "1": 0.14360708286671714, "5": 0.09977071256554365}, "score": 2.833553766899729}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "human", "scores": {"3": 0.282344534565348, "4": 0.2309775406062378, "2": 0.22401761316889712, "5": 0.14753971281750272, "1": 0.11510518689743833}, "score": 3.0718300863187786}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2667004394670668, "2": 0.22567625651629325, "4": 0.22302877053317777, "5": 0.1464587295161563, "1": 0.1381247937394893}, "score": 3.014020539939558}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2802351799394883, "4": 0.2344674750177703, "2": 0.22647264816599266, "5": 0.14147178232262006, "1": 0.11734105318806863}, "score": 3.0562569524051866}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2716613568331081, "2": 0.22662853762281243, "4": 0.22591257292917089, "5": 0.14277180393618907, "1": 0.13301502329956155}, "score": 3.0187977978171667}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2732750177088321, "4": 0.23495045895960504, "2": 0.22155531312884, "5": 0.1515620904559947, "1": 0.11864590618293498}, "score": 3.0792284028096337}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31974911701900754, "2": 0.2470155719523186, "4": 0.2369113875396263, "5": 0.10606371293638014, "1": 0.09025132503939243}, "score": 3.0215207826044828}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3076606774233111, "4": 0.24671910899877042, "2": 0.23369902721112745, "5": 0.12104946684832041, "1": 0.09086405414106341}, "score": 3.0733914697754714}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3274085171091483, "2": 0.24979052808598934, "4": 0.23669094934784088, "5": 0.1010435163481534, "1": 0.08505813628408249}, "score": 3.018871339018982}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.30666767793453004, "4": 0.2726716104437694, "2": 0.21362393989847625, "5": 0.138967456383611, "1": 0.06806298857404575}, "score": 3.200857876945123}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29691680418789895, "4": 0.25283302206071456, "2": 0.22047525778126084, "5": 0.13534570445463368, "1": 0.09441626707183179}, "score": 3.1142181175350445}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2780991706353475, "3": 0.25030034555050396, "1": 0.20657312769425915, "4": 0.1687287640187881, "5": 0.09628555224904299}, "score": 2.6700501399956473}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2674327890778064, "3": 0.2569596012558817, "4": 0.1858745676927656, "1": 0.1806023727382514, "5": 0.10911839429868189}, "score": 2.7754710656573836}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.27702021420169365, "3": 0.2549606906552098, "1": 0.18612486747494575, "4": 0.17887509679027647, "5": 0.10300931066830048}, "score": 2.7356211727198017}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.25921490818815573, "2": 0.256479535802627, "4": 0.2030890756251981, "1": 0.1605292516094099, "5": 0.12067404636180674}, "score": 2.8668973747136133}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.26046502183248577, "3": 0.2547659241251809, "4": 0.18964436953575928, "1": 0.17667395627877502, "5": 0.11844054195292149}, "score": 2.812710611270371}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.339021212436613, "2": 0.27612111142578843, "4": 0.22396311631342442, "1": 0.08668208921375303, "5": 0.07420438006688691}, "score": 2.922885962699428}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3144583638500112, "2": 0.28571587671739207, "4": 0.20167487660702405, "1": 0.12017315715479376, "5": 0.07797029173782498}, "score": 2.8315520168246815}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3258532344695441, "2": 0.2676033050752399, "4": 0.22263854433200742, "1": 0.0968112182889233, "5": 0.08708328668900676}, "score": 2.935578705357477}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3125039405891203, "4": 0.26167319529686156, "2": 0.2280913665080896, "5": 0.12068294036676369, "1": 0.07704168807985837}, "score": 3.120865163604646}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3186340861311321, "4": 0.2472349944768694, "2": 0.24680058910018624, "5": 0.10021255487768951, "1": 0.08710970305569905}, "score": 3.0266403240709088}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.29550216960914805, "3": 0.2789291701001921, "4": 0.17594694117358745, "1": 0.1682301662535593, "5": 0.08138261530295429}, "score": 2.7067470486972187}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2892691816447288, "2": 0.2654711253389452, "4": 0.2112926372445753, "1": 0.12741892487201117, "5": 0.10653988040820157}, "score": 2.904062631447563}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2868949092900782, "2": 0.2822585172910632, "4": 0.1981392723197535, "1": 0.1432805761629471, "5": 0.08941966987773432}, "score": 2.8081575889988475}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29384833855431086, "2": 0.24355446156745553, "4": 0.2350076058600054, "5": 0.12255241046063793, "1": 0.10502957519100212}, "score": 3.026499016446053}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2836630468412357, "2": 0.2737953635450452, "4": 0.20054233648236122, "1": 0.14181360847352414, "5": 0.10017667518642995}, "score": 2.843471702387039}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28187011478924767, "2": 0.2490362277820305, "4": 0.21091857931513122, "1": 0.13403324671392, "5": 0.12412539181567873}, "score": 2.942065689320651}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2759088559138063, "2": 0.2593115615209901, "4": 0.20727265054701496, "1": 0.14159185791160506, "5": 0.11590474372603882}, "score": 2.896585792346774}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.277391531412799, "2": 0.23718638792344163, "4": 0.22388098170676843, "5": 0.13648345233785075, "1": 0.12504781435249737}, "score": 3.0095659638091403}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28840082873916606, "2": 0.2615402467640952, "4": 0.2124555901474535, "1": 0.12837388452024845, "5": 0.10922143977572261}, "score": 2.9126097538937765}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2620718175491683, "2": 0.24220303911152088, "4": 0.21367169018493928, "1": 0.14573228571086078, "5": 0.13630770665798256}, "score": 2.9526188551802335}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28498224468643885, "2": 0.2567293402032946, "4": 0.20420285335790628, "1": 0.14421525055212203, "5": 0.10985053608595234}, "score": 2.8787416863252613}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27701506167362816, "2": 0.2487342056086334, "4": 0.1999974025036877, "1": 0.15386481296245108, "5": 0.12035918483099488}, "score": 2.884248545361789}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28218765107499727, "2": 0.23238613868400826, "4": 0.22534250269539782, "5": 0.13861622993275086, "1": 0.12145447230054135}, "score": 3.027280234063773}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28246565810931035, "2": 0.25123781959698166, "4": 0.21187116527675035, "1": 0.13579397928532272, "5": 0.11862248779252563}, "score": 2.926289707414162}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2769702165654526, "2": 0.2453146271152366, "4": 0.21117574024750663, "1": 0.13912573310531834, "5": 0.12738920150420419}, "score": 2.9423866394707288}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3002197417358882, "2": 0.27172403633793235, "4": 0.19886771978172924, "1": 0.1368139780890614, "5": 0.09236044282069755}, "score": 2.838234335046776}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2854035315441546, "2": 0.27353179817069373, "4": 0.20746546228177815, "1": 0.13156229674996597, "5": 0.10202575475214128}, "score": 2.874859183981762}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.317885761916541, "2": 0.2723287235288921, "4": 0.2046100513169452, "1": 0.11492193582888523, "5": 0.09023990896885664}, "score": 2.8829156795622173}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2912308288382599, "4": 0.25017234966149415, "2": 0.2240157762320006, "5": 0.1400403757132139, "1": 0.0945347298838519}, "score": 3.117168561030943}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.308507199127918, "2": 0.2585493226360601, "4": 0.22239893617565418, "1": 0.10721268576357128, "5": 0.10332119963011896}, "score": 2.95606617308454}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2466416760241969, "3": 0.23998803765176524, "1": 0.19351448721242692, "4": 0.18375164289573329, "5": 0.1360872030267574}, "score": 2.822252385111266}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2521642041253971, "3": 0.23363673135487958, "1": 0.21334873469917515, "4": 0.17064691188230263, "5": 0.13019080159177962}, "score": 2.752163714753673}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.26345428961392897, "3": 0.24666155614444255, "1": 0.2030236914702607, "4": 0.1714663228295064, "5": 0.11538038654134605}, "score": 2.7327217473728904}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.24713327820620015, "2": 0.2420987205141109, "4": 0.19425666089510288, "1": 0.18393710508448616, "5": 0.13256201570463447}, "score": 2.8494059214225693}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.25662048437462437, "3": 0.24906168058512587, "1": 0.18810815293387986, "4": 0.18101953959126052, "5": 0.12517422651678992}, "score": 2.798527995754376}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29001332754670706, "4": 0.2537650094077715, "2": 0.21828812817037307, "5": 0.1460447058051294, "1": 0.09187991741473182}, "score": 3.1438077395831963}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27504317325038874, "4": 0.2416148136559585, "2": 0.21987114692764154, "5": 0.15240169709463885, "1": 0.11105458964050198}, "score": 3.104439404303666}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3101242361538153, "2": 0.24837991243668922, "4": 0.23234054899609302, "5": 0.10977293213668561, "1": 0.09937228769652429}, "score": 3.0047619734527062}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27906515331411613, "4": 0.2586469951595147, "2": 0.21100007290179348, "5": 0.16206629484859664, "1": 0.08921278679054218}, "score": 3.1933556199848416}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2926656639968123, "2": 0.24054148728739178, "4": 0.22952759891535715, "5": 0.12097214094726091, "1": 0.11627943061212524}, "score": 2.9983715100233588}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29419404863390997, "2": 0.2394459897713194, "4": 0.23393803649357534, "5": 0.11756930376457095, "1": 0.11484472274617762}, "score": 2.999941208294671}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2921414722606141, "2": 0.2489432550136728, "4": 0.22342555671204625, "1": 0.12191329300486774, "5": 0.11356635356190464}, "score": 2.9577879977609327}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30565202417609016, "2": 0.2584217600240027, "4": 0.2209892546808634, "1": 0.1156743689007927, "5": 0.09925150458332686}, "score": 2.9297209867938876}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29783828725148515, "2": 0.25009655892242355, "4": 0.22763994200808316, "1": 0.11522311497769365, "5": 0.10919327519838283}, "score": 2.9654833990339435}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3038040979312952, "4": 0.2397789312316184, "2": 0.2391253709361815, "5": 0.11286566192656555, "1": 0.10441215323623382}, "score": 3.0175608197474015}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30370595468314915, "2": 0.2451579946887882, "4": 0.23548119973175874, "5": 0.11546390600274431, "1": 0.10017624442765277}, "score": 3.020898835415771}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2999145434714564, "4": 0.25925060453865056, "2": 0.2180861741576741, "5": 0.14335732345873678, "1": 0.07937522397825271}, "score": 3.169131357497587}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2958044455244736, "4": 0.2501073133056748, "2": 0.22484781126800768, "5": 0.13724264340398395, "1": 0.09198266901045864}, "score": 3.1157812011455674}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3025871632624813, "4": 0.25737611022399254, "2": 0.22419304281068927, "5": 0.13401587713071922, "1": 0.08181247834521738}, "score": 3.137591974025304}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30294830457267974, "4": 0.25976476694821654, "2": 0.22139370318740795, "5": 0.14102061409989614, "1": 0.07485992338126746}, "score": 3.1706946109389484}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2691688503044904, "3": 0.259463173432964, "1": 0.20192139317795216, "4": 0.16713200996448038, "5": 0.10227647432179794}, "score": 2.6986618413259493}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2897796999589183, "3": 0.24831926546736852, "1": 0.19809372533687347, "4": 0.16168802047870304, "5": 0.10210615209949778}, "score": 2.679928969381164}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2648226294295107, "2": 0.26020869418279924, "4": 0.19079260091335437, "1": 0.16839733545716692, "5": 0.11575268381244146}, "score": 2.8252900511629093}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26816087465579286, "2": 0.23271794388021996, "4": 0.2223666017211061, "5": 0.14401360567720167, "1": 0.13272291099294853}, "score": 3.0122302681256157}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.26602028864701627, "3": 0.2639792968324816, "1": 0.18933663702606493, "4": 0.17423256356020958, "5": 0.10640347955763076}, "score": 2.7423388139039555}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2866036007469587, "4": 0.26050995592420584, "2": 0.20938351679505265, "5": 0.16314645249563772, "1": 0.08034849640833729}, "score": 3.2167240802482366}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2975412226696615, "4": 0.2611980361960421, "2": 0.21667546454340547, "5": 0.14789151215391433, "1": 0.07668457492697445}, "score": 3.186938163976644}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2982917334642897, "4": 0.2755886564940816, "2": 0.19896871055740156, "5": 0.16293151823236052, "1": 0.06420603946803216}, "score": 3.274074560108872}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27390178109891034, "4": 0.27242887721265996, "2": 0.19211246946347207, "5": 0.18866025011812848, "1": 0.07288845646767372}, "score": 3.311862541607078}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2716340019118184, "3": 0.27006046516504256, "2": 0.19240622246102115, "5": 0.1902589576070955, "1": 0.07563043480675674}, "score": 3.308487884649205}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29422449929373806, "4": 0.25694749874367895, "2": 0.2211779274060091, "5": 0.13985375632832947, "1": 0.08777820884297605}, "score": 3.1399232002315176}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.329052916738454, "4": 0.3054430296758211, "2": 0.19173106346250604, "5": 0.1336409169731481, "1": 0.040121994651025214}, "score": 3.3007528419947927}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32330966495573, "4": 0.27464382571589857, "2": 0.2118974389301775, "5": 0.12797948517215543, "1": 0.06215749953517136}, "score": 3.194392707429857}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.33125523434842047, "4": 0.2799639875436946, "2": 0.2106578554023208, "5": 0.1223440893033611, "1": 0.05576610675304237}, "score": 3.2024646739388833}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.32317154424748523, "3": 0.2780678306248596, "5": 0.2000339253638205, "2": 0.15697908485376655, "1": 0.041737816109016855}, "score": 3.4827894086606914}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2694731830209357, "2": 0.24280413244182808, "4": 0.21873900890772333, "1": 0.13767884722104254, "5": 0.13129516794343166}, "score": 2.9631671620883306}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2638165246063104, "2": 0.23631677666422646, "4": 0.21741972000807025, "1": 0.142053106764343, "5": 0.14038581854588075}, "score": 2.977768187864995}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.26786134547036305, "4": 0.23077750833155075, "2": 0.2265203030242821, "5": 0.15062359538884262, "1": 0.12420719256601549}, "score": 3.0570905850112546}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.270511788835041, "4": 0.2650035120671901, "2": 0.19754860967263432, "5": 0.1790533272342885, "1": 0.08787627673208338}, "score": 3.2498106235354633}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27122200142718905, "2": 0.22814844210784968, "4": 0.22627887052782406, "5": 0.14503990029018918, "1": 0.1293014214291323}, "score": 3.029607663394697}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3017184745065429, "2": 0.27424034103759537, "4": 0.2062633558969329, "1": 0.1264593457421246, "5": 0.0913112115414311}, "score": 2.861725741027737}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.310138099017004, "4": 0.2436164297044911, "2": 0.24156620564558073, "5": 0.11521812592482891, "1": 0.0894541030786031}, "score": 3.053578646764448}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3081530511850984, "2": 0.25242078557054254, "4": 0.22831082748615736, "5": 0.10896539763954786, "1": 0.10214157886807881}, "score": 2.989537592000662}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3026408469868497, "2": 0.25187236698333704, "4": 0.23224512310038642, "5": 0.10937033353908884, "1": 0.10386426256064939}, "score": 2.9913848371920397}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30727428309172405, "2": 0.2493447504872171, "4": 0.23993570196816716, "5": 0.11174039499613789, "1": 0.09169870701341387}, "score": 3.030674516476368}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.289068498477781, "2": 0.2733710087500917, "4": 0.18819125865757866, "1": 0.15975269751726245, "5": 0.08960407321909372}, "score": 2.7745201910710158}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28607444638200463, "2": 0.24186058835539997, "4": 0.2252596369628488, "5": 0.12367717940377254, "1": 0.12311631746834387}, "score": 2.9845205893347795}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2953099193621823, "2": 0.28219868482786276, "4": 0.18713950953184874, "1": 0.15039462592296146, "5": 0.08494646877530895}, "score": 2.774042071965661}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2859176347568889, "2": 0.24026675348851242, "4": 0.22967729970700487, "5": 0.12824717788098441, "1": 0.11587957194945543}, "score": 3.0141459216397686}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2899853136123609, "2": 0.2819251130135454, "4": 0.18601229598643235, "1": 0.1538799540049737, "5": 0.08818650784056908}, "score": 2.772697832247909}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29755089291653897, "2": 0.26369643628283845, "4": 0.21579659603176546, "1": 0.12480155040587222, "5": 0.09814375376194916}, "score": 2.8987834762982856}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2999426767750654, "2": 0.24078511072417086, "4": 0.23885070201609343, "5": 0.11401705916324563, "1": 0.10639119066543906}, "score": 3.0133175048863867}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29116196089119545, "2": 0.23906378017385915, "4": 0.23362077451106045, "5": 0.11898046012300818, "1": 0.117162865419808}, "score": 2.998192165378025}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.29888314541223415, "2": 0.25441810057201136, "4": 0.22324934347306463, "1": 0.12290541538951383, "5": 0.10053428151959141}, "score": 2.9240882377821653}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29092580789635464, "2": 0.24149116268401444, "4": 0.23797993870947964, "5": 0.11735313993900401, "1": 0.11224065584132953}, "score": 3.0067138066251755}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2787487612956789, "2": 0.235372456081882, "4": 0.22042475268528278, "5": 0.13463605902364653, "1": 0.1308054989422291}, "score": 2.9927133258870455}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2852990359052224, "2": 0.25413285437129735, "4": 0.20706500524819663, "1": 0.13798396447957195, "5": 0.11550937309214682}, "score": 2.9079820693717946}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2938753150699933, "4": 0.24766521111722326, "2": 0.21895015014167055, "5": 0.14737263024741595, "1": 0.092127084671628}, "score": 3.1392074897373834}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2895201446808959, "4": 0.2593381163844757, "2": 0.21621735588719568, "5": 0.14753040335534054, "1": 0.08738252142637233}, "score": 3.1634183968466307}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.26208895760650974, "4": 0.24649171416486307, "2": 0.20370400391549792, "5": 0.17820323684447215, "1": 0.10949526200745904}, "score": 3.180206691984095}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2699757334861695, "2": 0.24968007016498686, "4": 0.20900462459778524, "1": 0.1458127521392642, "5": 0.1255173353086449}, "score": 2.9187329500102215}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28300101352072343, "2": 0.2545053300471653, "4": 0.2184615396168553, "1": 0.12602411518327522, "5": 0.1179977998534552}, "score": 2.9479030474284778}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2814699462442006, "4": 0.24911182174796642, "2": 0.22946632322711516, "5": 0.14131671526550985, "1": 0.09862748536317796}, "score": 3.105024767872393}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2881604315356253, "4": 0.2566743290003499, "2": 0.22397099995386993, "5": 0.14352171947629558, "1": 0.08766615254459516}, "score": 3.144415382473278}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2896685038499723, "2": 0.2509139568536645, "4": 0.2203925509813072, "5": 0.11965978353767906, "1": 0.11935344045623489}, "score": 2.9700909284306083}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2936332909134491, "3": 0.26359100516032696, "1": 0.2234274781800963, "4": 0.13871895488050787, "5": 0.08060827235973277}, "score": 2.5594380011826057}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28790411163405744, "2": 0.27739269645967746, "1": 0.18884345265069982, "4": 0.15753472008921365, "5": 0.0883091634876129}, "score": 2.6790683567143296}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28857643176297787, "2": 0.26429943370399817, "4": 0.18042332205959657, "1": 0.15918931892536353, "5": 0.10749695042030644}, "score": 2.812736427947432}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2879399579273413, "2": 0.2793014261181009, "4": 0.17446795380870428, "1": 0.16621989475904653, "5": 0.09205484852113359}, "score": 2.746832405073841}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2848049554048518, "2": 0.2678297932623282, "4": 0.17569901323451326, "1": 0.17155792745336684, "5": 0.1000974867869125}, "score": 2.764945794445927}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2985565550325173, "2": 0.28760409923090996, "4": 0.17747422355863404, "1": 0.15175254168848923, "5": 0.08460052556813108}, "score": 2.755563145419959}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.29131369579633026, "3": 0.2839495208798408, "1": 0.1975511975763718, "4": 0.1493508862933245, "5": 0.07781307521726812}, "score": 2.6185526972719617}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3057664205657665, "2": 0.28682325189211916, "4": 0.17408525996142374, "1": 0.15623218701007463, "5": 0.07707650337871665}, "score": 2.728946201706519}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2860778220803885, "2": 0.2731565240308632, "4": 0.18808736813136215, "1": 0.15711720868994894, "5": 0.09555028744310132}, "score": 2.7917947551504265}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2858939617568068, "2": 0.2562184443787897, "4": 0.20370516503162941, "1": 0.1407723404815029, "5": 0.11340126869097106}, "score": 2.892743631107037}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29270195678925454, "2": 0.28412534004368273, "4": 0.17750020768695482, "1": 0.16062469856059022, "5": 0.08503599002896164}, "score": 2.74219440669759}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.29566219779949676, "3": 0.2859006803438512, "1": 0.18145762928425557, "4": 0.1598001670949514, "5": 0.0771678160051246}, "score": 2.6555543783498443}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2864365022576587, "2": 0.27878798400564614, "4": 0.1816434644077813, "1": 0.16277198866743822, "5": 0.0903498429667678}, "score": 2.758008716407736}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3081468265563334, "2": 0.2799801699298411, "4": 0.18194349629965434, "1": 0.1437785083515471, "5": 0.08614111977181883}, "score": 2.7866864418663466}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29500679175766537, "2": 0.2754306241687205, "4": 0.1861063675825786, "1": 0.15214930051315564, "5": 0.09129718721643407}, "score": 2.78896946375467}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28252416280505693, "2": 0.26041447047791577, "4": 0.19571444408934024, "1": 0.15165408624118182, "5": 0.10967805250938575}, "score": 2.8513457084610527}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28046938622315354, "2": 0.2603399765547758, "4": 0.20113446791463924, "1": 0.14848444109493789, "5": 0.10956242509221929}, "score": 2.8629491843542048}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28386542748660254, "2": 0.25956308598666816, "4": 0.20459165770013726, "1": 0.13883265389068092, "5": 0.11313569952478784}, "score": 2.893633442381704}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2904045291228645, "2": 0.25520893917749304, "4": 0.2080342186648061, "1": 0.13223132870838028, "5": 0.11410995247725135}, "score": 2.91658160676592}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2873033938940534, "2": 0.23953735584338728, "4": 0.22687032051612036, "5": 0.1274575386559402, "1": 0.11882184600834046}, "score": 3.0046043939172513}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3084737896074107, "4": 0.24846536982439543, "2": 0.23239922239191907, "5": 0.12350094143348023, "1": 0.08714920755005663}, "score": 3.0887706333268268}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3129204418950643, "4": 0.26803768303932995, "2": 0.22141396163805957, "5": 0.1272225454090626, "1": 0.07039577724024774}, "score": 3.1602787949372777}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31789399526439605, "4": 0.2686859375130127, "2": 0.21934402309442227, "5": 0.12290503438331671, "1": 0.07115898357094846}, "score": 3.152835854073887}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3164373193939841, "4": 0.26842678064661174, "2": 0.22563482615902006, "5": 0.1198746938130929, "1": 0.06961834282693477}, "score": 3.143305808231669}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3068567354765385, "4": 0.2669431672448405, "2": 0.22157481085428263, "5": 0.12894256581543914, "1": 0.07567256512599915}, "score": 3.1519099004878344}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27579823864283004, "2": 0.2481304904567767, "4": 0.22456906048904646, "1": 0.13067405318244846, "5": 0.1208205490401352}, "score": 2.956731232550693}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27369634966978973, "4": 0.26602701904545817, "2": 0.207340190978302, "5": 0.15987939967395268, "1": 0.0930505579195979}, "score": 3.192345758498196}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28195776183196253, "4": 0.2511992073115398, "2": 0.22809259820479427, "5": 0.13481447566911825, "1": 0.10392906290709587}, "score": 3.0848780197862657}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2759850172678219, "4": 0.2691931035104933, "2": 0.20113772631941249, "5": 0.16779966187478812, "1": 0.08587793941755824}, "score": 3.231900341426119}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.28394321727044763, "3": 0.2708392520397261, "5": 0.1864782441600707, "2": 0.18647645397751964, "1": 0.07225600075543218}, "score": 3.325913476676853}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2958219872482002, "2": 0.2724387393165181, "4": 0.2026949782759574, "1": 0.1369173937964395, "5": 0.09212084787911357}, "score": 2.8406621825758958}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3106765314109696, "2": 0.24787913759927474, "4": 0.232724576436134, "5": 0.11060201182056296, "1": 0.0981123135402363}, "score": 3.0098248887387284}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3204361315547809, "4": 0.25306363503587836, "2": 0.23238953154640085, "5": 0.11295364112258212, "1": 0.08115318804211846}, "score": 3.0842753360233504}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3114257599433204, "4": 0.2692724733359457, "2": 0.21354292770300687, "5": 0.13598958188052182, "1": 0.06976470891577002}, "score": 3.188180147447423}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3146728661345627, "2": 0.25297168841861856, "4": 0.22693455659604658, "5": 0.10493641328802752, "1": 0.10047865119188376}, "score": 2.982878292646542}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2698580497232941, "2": 0.24990610791583537, "4": 0.2089127245741836, "1": 0.14595868160968567, "5": 0.12535497077481744}, "score": 2.9177984169175675}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27707933662354234, "4": 0.243546521821427, "2": 0.22642869409086466, "5": 0.14357477490785378, "1": 0.10935891587227993}, "score": 3.085550551592514}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27752246336743763, "2": 0.23829616218019845, "4": 0.2321486220815266, "5": 0.13110032620506235, "1": 0.12092233487539285}, "score": 3.014208585943634}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2893621966379866, "4": 0.2591867589776563, "2": 0.21858292871481289, "5": 0.14462971390717322, "1": 0.08822843285043505}, "score": 3.1534079216863815}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2884923816908927, "4": 0.2376978380370525, "2": 0.23664699991937774, "5": 0.1312667193630533, "1": 0.10588616256720224}, "score": 3.051812464571038}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.32778912137453253, "2": 0.28856970801044984, "4": 0.20319879366163188, "1": 0.10670839982657729, "5": 0.073722561532929}, "score": 2.848655681378608}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31984256136255423, "2": 0.27247963544046677, "4": 0.2110843209456866, "1": 0.1081334031235812, "5": 0.0884492091169234}, "score": 2.899235202177465}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31756406546890953, "2": 0.2569157933785952, "4": 0.22696839506102987, "5": 0.10372656758320871, "1": 0.09481051103223288}, "score": 2.987884537081124}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3234381737495895, "2": 0.2608677252328615, "4": 0.22451389064877672, "1": 0.10226702441216313, "5": 0.08890537296385638}, "score": 2.9369223696942335}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30474671195441344, "4": 0.2408497461215716, "2": 0.23709129524923975, "5": 0.11830479219319967, "1": 0.09899489458755431}, "score": 3.0423787783565874}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2784824605150489, "2": 0.26220852364503644, "4": 0.19914015613024189, "1": 0.14851916081584307, "5": 0.11163786438228361}, "score": 2.8631674202713415}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2747667013782345, "2": 0.2718537068060997, "4": 0.18609561094540214, "1": 0.1653978822968843, "5": 0.10186758452592462}, "score": 2.7871773683890826}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29566731279976327, "2": 0.24711938970623548, "4": 0.2282675210299305, "5": 0.12256442118537896, "1": 0.10637173349607874}, "score": 3.013533636920008}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28055979607509823, "2": 0.250972727784167, "4": 0.21570222724062038, "1": 0.1322444996046194, "5": 0.12051154759246822}, "score": 2.941263054952226}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27211372321784794, "2": 0.2519425987891108, "4": 0.21496385097301113, "1": 0.1370384000627177, "5": 0.12393217981221077}, "score": 2.9368082273393954}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29022592720013257, "2": 0.27035112551106005, "4": 0.18274597595367773, "1": 0.16814136417159015, "5": 0.08852201507444826}, "score": 2.75315279707916}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29553254879364727, "2": 0.27639134524679865, "4": 0.18466778961016142, "1": 0.1582550827484533, "5": 0.08514276016282267}, "score": 2.7620493070302445}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2955526161349889, "2": 0.2741795486930677, "4": 0.1850470059429741, "1": 0.1587359260408814, "5": 0.0864741027537961}, "score": 2.7663412870601602}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3066845757891158, "2": 0.2727479964592167, "4": 0.19338147238675743, "1": 0.14494878584800291, "5": 0.0822260843005787}, "score": 2.7951858024230054}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29766267402309604, "2": 0.2935569268260626, "4": 0.17720564228156385, "1": 0.16183886487807, "5": 0.06972428500646301}, "score": 2.6994160668391607}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27777134603614684, "2": 0.23758636013041662, "4": 0.22212701968237078, "1": 0.13229423288574166, "5": 0.1302064514666696}, "score": 2.9803648102403444}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28773150729889324, "2": 0.23765541275953153, "4": 0.23332382113549158, "5": 0.1279045623251893, "1": 0.11337164081051332}, "score": 3.0247345743317613}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28177415435335335, "4": 0.25007460140849913, "2": 0.22048054925094496, "5": 0.14669644899830883, "1": 0.10096453120558499}, "score": 3.1210590638055744}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2917117855331168, "4": 0.26272505812278346, "2": 0.2147733699623062, "5": 0.14650350879393328, "1": 0.08427733595519482}, "score": 3.1724055754252793}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2964852526181682, "4": 0.2457864523321444, "2": 0.23133934973075063, "5": 0.1296785607616023, "1": 0.09669924347272266}, "score": 3.080406632996255}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28499353020678025, "2": 0.2622520538728705, "4": 0.19961627107807306, "1": 0.14835240807313535, "5": 0.10477208574182172}, "score": 2.850201527639537}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28668300094078475, "2": 0.25847487115266915, "4": 0.21381164822493393, "1": 0.1279494519115265, "5": 0.11306930835688095}, "score": 2.9255756177528855}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.276246692243789, "2": 0.24211956611133728, "4": 0.22110170051289205, "1": 0.13141836744682178, "5": 0.12910162423404098}, "score": 2.9743483388875562}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2813741501799142, "2": 0.24670438030761901, "4": 0.21688318247529917, "5": 0.12820281203317188, "1": 0.12682381996600386}, "score": 2.972936470875556}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2855412148670827, "2": 0.2628643130234102, "4": 0.2057182427627808, "1": 0.13649061790719302, "5": 0.10937269596380735}, "score": 2.8886166472836106}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3352233677319121, "2": 0.304295442252837, "4": 0.1959936927728021, "1": 0.08820893652119885, "5": 0.07626658339454058}, "score": 2.8678119610073183}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3268149403290907, "2": 0.2735728857323776, "4": 0.2224127698197062, "5": 0.09258996616041495, "1": 0.08459517898386902}, "score": 2.964828956937412}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3188082353690332, "2": 0.3131110058618756, "4": 0.19048350044569973, "1": 0.10108535702434386, "5": 0.07649908492392102}, "score": 2.828197748500876}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3197161525843887, "2": 0.2689261963596456, "4": 0.23352461263447483, "1": 0.08954334224757697, "5": 0.0882792670666057}, "score": 2.962069870335495}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2863695412314799, "2": 0.2777008010738431, "4": 0.21579109328872692, "1": 0.12620158115393307, "5": 0.09392575962358539}, "score": 2.873537229783045}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2830788211935149, "2": 0.24608250822375094, "4": 0.2258369500597289, "5": 0.12283413863386822, "1": 0.12215868288674674}, "score": 2.9811051851852186}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28137960889137703, "2": 0.23878509873927226, "4": 0.23770223548773245, "5": 0.13098800825620485, "1": 0.1111354334768457}, "score": 3.03862265766977}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2790193345777632, "4": 0.23954032612501544, "2": 0.23270332965223584, "5": 0.14093241919395827, "1": 0.10779170193007521}, "score": 3.073119373401122}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2840840880392764, "2": 0.23825880027121882, "4": 0.23633206685430896, "5": 0.13061309489190864, "1": 0.11070348038162738}, "score": 3.0378928165391987}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2841263344841131, "4": 0.2531374897794649, "2": 0.2266000295459751, "5": 0.13919875153218775, "1": 0.09692907049205252}, "score": 3.1110777469433875}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26762937090653954, "2": 0.2502147324472474, "4": 0.20522987225280395, "1": 0.14600910444583617, "5": 0.13090392785300584}, "score": 2.9248038096638798}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2636204762821089, "4": 0.23026786897904925, "2": 0.23004749301633082, "5": 0.14909920339235438, "1": 0.1269536779003282}, "score": 3.044511929060463}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2796433046200228, "2": 0.2334765582141641, "4": 0.23281796426854673, "5": 0.1412554112436255, "1": 0.11279660927373354}, "score": 3.0562595811628075}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28229397118729305, "4": 0.2356082525539597, "2": 0.234043332299777, "5": 0.13686875568749532, "1": 0.11117380405086194}, "score": 3.0529554528617333}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27514559088765006, "4": 0.24211542590215565, "2": 0.2249917374267014, "5": 0.15317284336792122, "1": 0.1045646435778039}, "score": 3.1143412038929474}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2857943736497863, "2": 0.2672278269406959, "4": 0.19557444093225398, "1": 0.14129941915810473, "5": 0.1100885981118377}, "score": 2.865922914994666}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2987421954781986, "2": 0.249512291618509, "4": 0.2190752940076591, "5": 0.11995435302807175, "1": 0.11270214784989975}, "score": 2.9840671941789823}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3002153585596561, "2": 0.25206424083749285, "4": 0.2232415745310921, "5": 0.11495064691432053, "1": 0.10951880601968125}, "score": 2.9820408471492645}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2913614460240955, "2": 0.24145547292770772, "4": 0.22825252434644525, "5": 0.12988531632416672, "1": 0.10903551763152664}, "score": 3.0284969258723917}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2863805666710556, "2": 0.251149474792174, "4": 0.2160959623106363, "5": 0.12434839698124663, "1": 0.12201215598392955}, "score": 2.969618561087485}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2701131861132399, "3": 0.25312283354310877, "1": 0.1919869841764324, "4": 0.1735152824827988, "5": 0.111249483571555}, "score": 2.741923938860449}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.2635076708603424, "3": 0.25672543794698066, "4": 0.1842459553723075, "1": 0.1743224907622295, "5": 0.12117764131063982}, "score": 2.814444725363705}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.2683191630863354, "3": 0.2553481936320136, "4": 0.183689380014997, "1": 0.17861641597678635, "5": 0.11401835896512895}, "score": 2.7861722878662887}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.26730918347305266, "2": 0.25562634259333455, "4": 0.20579525751345837, "1": 0.14334169836206304, "5": 0.12791823605374963}, "score": 2.91932124144291}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.26444906952641767, "3": 0.2502020468818941, "4": 0.18400281915425645, "1": 0.1801251125173591, "5": 0.12120945461679761}, "score": 2.8017201541431946}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2740201870343808, "2": 0.2579981666741278, "4": 0.19605912638771242, "1": 0.16448103568699932, "5": 0.10743073120369338}, "score": 2.8239584577699652}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2766884596894296, "2": 0.2564529915443605, "4": 0.19965761588892075, "1": 0.15960442001824562, "5": 0.1075891578292643}, "score": 2.8391729170786135}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27814948332596107, "2": 0.2496561269943514, "4": 0.20759450442126842, "1": 0.1482284521098395, "5": 0.11636115724727823}, "score": 2.894202700539187}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2812983300636603, "2": 0.24731152555023267, "4": 0.2085143323120538, "1": 0.1411179942366966, "5": 0.12174996554712143}, "score": 2.9224661405643038}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2793093583912403, "2": 0.2617415532626348, "4": 0.19043537134650493, "1": 0.16149130124986272, "5": 0.10701318797632092}, "score": 2.8197359281007723}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2762398966587459, "2": 0.263845994557975, "4": 0.1851233165538758, "1": 0.162270140271229, "5": 0.11250053520176007}, "score": 2.8217345257338398}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.27601214792846945, "3": 0.2721847813872204, "1": 0.18064586702610885, "4": 0.1710930873718132, "5": 0.10003231451942089}, "score": 2.733845370242455}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29409248096558377, "2": 0.2690972609121207, "4": 0.19129847009124107, "1": 0.14716430430834462, "5": 0.09832786726411921}, "score": 2.8245248928904974}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.28724510594894426, "2": 0.2684839079436622, "4": 0.19232931382834131, "1": 0.14207573762675088, "5": 0.10984730652766611}, "score": 2.859385924309983}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2786295380792609, "2": 0.27103695556529833, "4": 0.1830359678179435, "1": 0.16527503731290064, "5": 0.10200339315761989}, "score": 2.7854516243373517}]